In [1]:
# As usual, a bit of setup
import time
import numpy as np
import matplotlib.pyplot as plt
from cs682.data_utils import get_CIFAR10_data

import torch
import torch.nn as nn
import torch.optim as optim

import torchvision.datasets as dset
import torchvision.transforms as T

import torch.nn.functional as F 

%matplotlib inline
plt.rcParams['figure.figsize'] = (20.0, 16.0) # default figure size (width, height) for every plot below
plt.rcParams['image.interpolation'] = 'nearest' # show image pixels as-is, without smoothing
# plt.rcParams['image.cmap'] = 'gray'

# for auto-reloading external modules
# see http://stackoverflow.com/questions/1907993/autoreload-of-modules-in-ipython
%load_ext autoreload
%autoreload 2

def rel_error(x, y):
    """Return the largest element-wise relative error between ``x`` and ``y``.

    Each element's error is ``|x - y| / max(1e-8, |x| + |y|)``; the ``1e-8``
    floor keeps the denominator non-zero where both inputs are zero.
    """
    abs_diff = np.abs(x - y)
    scale = np.maximum(1e-8, np.abs(x) + np.abs(y))
    return np.max(abs_diff / scale)
In [2]:
# Load CIFAR-10 without mean subtraction, report the shape of every array,
# and divide the image arrays (keys starting with "X") by 255.
unproccessed_data = get_CIFAR10_data(subtract_mean=False)
for k, v in list(unproccessed_data.items()):
    print('%s: ' % k, v.shape)
    if not k.startswith("X"):
        continue  # label arrays are left untouched
    unproccessed_data[k] = v / 255
X_train:  (49000, 3, 32, 32)
y_train:  (49000,)
X_val:  (1000, 3, 32, 32)
y_val:  (1000,)
X_test:  (1000, 3, 32, 32)
y_test:  (1000,)

Preprocess data

Convert the images to grayscale (the same gray value copied into all three channels) for the X data, and use the original color images as the Y data.

In [3]:
# The targets (Y) are the original colour images of each split.
data = {
    "y_train": unproccessed_data["X_train"],
    "y_val": unproccessed_data["X_val"],
    "y_test": unproccessed_data["X_test"],
}

# Convert X data to B/W

def convertToBW(data):
    """Return a grayscale copy of a batch of channels-first RGB images.

    The gray value is the weighted sum 0.299 * R + 0.587 * G + 0.114 * B of
    channels 0, 1 and 2, and it is written to each of those three channels.
    The result is a new float array (``np.zeros`` default dtype) with the
    same shape as ``data``.
    """
    red, green, blue = data[:, 0, :, :], data[:, 1, :, :], data[:, 2, :, :]
    luma = 0.299 * red + 0.587 * green + 0.114 * blue

    out = np.zeros(data.shape)
    # Broadcast the single gray plane over the first three channels.
    out[:, :3, :, :] = luma[:, np.newaxis, :, :]
    return out

# The inputs (X) are the grayscale versions of each split.
for split in ("train", "val", "test"):
    data["X_" + split] = convertToBW(unproccessed_data["X_" + split])

# One row per randomly drawn training example: input on the left, target on the right.
fig, axs = plt.subplots(5, 2)
idx = np.random.choice(range(data["X_train"].shape[0]), 5)

# Column headers go on the first row only.
axs[0, 0].title.set_text('X data')
axs[0, 1].title.set_text('Y data')

for (ax_input, ax_target), sample in zip(axs, idx):
    # imshow wants channels last, so move (C, H, W) to (H, W, C).
    ax_input.imshow(data["X_train"][sample].transpose(1, 2, 0))
    ax_target.imshow(data["y_train"][sample].transpose(1, 2, 0))

Basic Model

Test a basic model that uses a single fully connected (FC) layer.

In [4]:
USE_GPU = True

# Every tensor in this notebook is created as a single-precision float.
dtype = torch.float32

# Use CUDA only when it is both requested and actually available.
device = torch.device('cuda' if USE_GPU and torch.cuda.is_available() else 'cpu')

# Number of iterations between two training-loss printouts.
print_every = 100

print('using device:', device)

def flatten(x):
    """Return a view of ``x`` that keeps axis 0 and merges all other axes into one."""
    return x.view(x.shape[0], -1)
using device: cpu
In [18]:
batch_size = 100  # number of random samples train() draws for each of its "epochs"
print_every = 20  # train() prints the loss every this many iterations (replaces the earlier value of 100)

def train(model, optimizer, epochs=1, x_train=data["X_train"], y_train=data["y_train"], criterion=nn.MSELoss()):
    """
    Train an image-to-image model with one gradient step per sample.

    An "epoch" here is NOT a full pass over the data: it draws `batch_size`
    random samples (with replacement) from `x_train` / `y_train` and performs
    one optimizer step for each of them, so the effective minibatch size is 1.

    Inputs:
    - model: A PyTorch Module giving the model to train. It is called on one
      sample (`x_train[i]`) at a time. Its `epochsTrained` counter is
      incremented once per epoch and is created, starting from 0, when the
      module does not define one.
    - optimizer: An Optimizer object we will use to train the model
    - epochs: (Optional) A Python integer giving the number of epochs, as
      defined above, to train for
    - x_train: (Optional) NumPy array of inputs, indexed along axis 0
    - y_train: (Optional) NumPy array of targets aligned with `x_train`
    - criterion: (Optional) Callable `criterion(prediction, target)` that
      takes two flat tensors and returns a scalar loss tensor

    The default arrays are bound when this function is defined, so this cell
    has to be re-run after `data` is rebuilt.

    Returns: Nothing, but prints the training loss every `print_every`
    iterations.
    """
    model = model.to(device=device)  # move the model parameters to CPU/GPU
    model.train()  # training mode; nothing below leaves it, so set it once

    num_samples = x_train.shape[0]
    for e in range(epochs):
        # Tolerate modules that do not define the bookkeeping counter.
        model.epochsTrained = getattr(model, "epochsTrained", 0) + 1
        print("--- Epoch " + str(e + 1) + " / " + str(epochs) + " - " + str(model.epochsTrained) + " epochs total")

        # Draw this epoch's samples and move them to the device in one go
        # instead of once per sample.
        idx = np.random.choice(num_samples, batch_size)
        x_batch = torch.from_numpy(x_train[idx]).to(device=device, dtype=dtype)
        y_batch = flatten(torch.from_numpy(y_train[idx])).to(device=device, dtype=dtype)

        for t in range(x_batch.shape[0]):
            scores = model(x_batch[t])
            loss = criterion(scores.view(-1), y_batch[t].view(-1))

            # Zero out all of the gradients for the variables which the
            # optimizer will update.
            optimizer.zero_grad()

            # Backward pass: compute the gradient of the loss with respect to
            # each parameter of the model.
            loss.backward()

            # Update the parameters using the gradients just computed.
            optimizer.step()

            if t % print_every == 0:
                print('Iteration %d, loss = %.4f' % (t, loss.item()))
In [19]:
class BasicNet(nn.Module):
    """Baseline model: one fully connected layer that maps a flattened input
    of `input_size` values to an output of the same length."""

    def __init__(self, input_size):
        super().__init__()

        # Bookkeeping counter; starts at zero for a fresh model.
        self.epochsTrained = 0
        self.fc = nn.Linear(in_features=input_size, out_features=input_size)

    def forward(self, x):
        """Flatten `x` to one dimension and return the linear layer's output."""
        return self.fc(x.view(-1))
In [21]:
learning_rate = 1e-2

# The fully connected baseline takes the whole 3-channel image as one flat vector.
spatial = data["X_train"].shape[2:]
model1 = BasicNet(3 * spatial[0] * spatial[1])
optimizer = optim.SGD(model1.parameters(), lr=learning_rate)

train(model1, optimizer, epochs=25)
--- Epoch 1 / 25 - 1 epochs total
Iteration 0, loss = 0.1488
Iteration 20, loss = 0.2187
Iteration 40, loss = 0.4903
Iteration 60, loss = 0.6881
Iteration 80, loss = 0.1929
--- Epoch 2 / 25 - 2 epochs total
Iteration 0, loss = 0.1037
Iteration 20, loss = 0.0865
Iteration 40, loss = 0.0571
Iteration 60, loss = 0.1310
Iteration 80, loss = 0.1437
--- Epoch 3 / 25 - 3 epochs total
Iteration 0, loss = 0.0813
Iteration 20, loss = 0.2574
Iteration 40, loss = 0.0593
Iteration 60, loss = 0.1005
Iteration 80, loss = 0.0389
--- Epoch 4 / 25 - 4 epochs total
Iteration 0, loss = 0.0145
Iteration 20, loss = 0.1109
Iteration 40, loss = 0.0839
Iteration 60, loss = 0.0890
Iteration 80, loss = 0.1745
--- Epoch 5 / 25 - 5 epochs total
Iteration 0, loss = 0.0308
Iteration 20, loss = 0.0375
Iteration 40, loss = 0.1164
Iteration 60, loss = 0.0505
Iteration 80, loss = 0.0474
--- Epoch 6 / 25 - 6 epochs total
Iteration 0, loss = 0.0188
Iteration 20, loss = 0.0376
Iteration 40, loss = 0.0421
Iteration 60, loss = 0.0615
Iteration 80, loss = 0.0739
--- Epoch 7 / 25 - 7 epochs total
Iteration 0, loss = 0.0254
Iteration 20, loss = 0.0462
Iteration 40, loss = 0.0866
Iteration 60, loss = 0.0442
Iteration 80, loss = 0.0398
--- Epoch 8 / 25 - 8 epochs total
Iteration 0, loss = 0.0476
Iteration 20, loss = 0.0264
Iteration 40, loss = 0.0345
Iteration 60, loss = 0.0511
Iteration 80, loss = 0.0583
--- Epoch 9 / 25 - 9 epochs total
Iteration 0, loss = 0.0698
Iteration 20, loss = 0.0462
Iteration 40, loss = 0.0438
Iteration 60, loss = 0.0477
Iteration 80, loss = 0.0605
--- Epoch 10 / 25 - 10 epochs total
Iteration 0, loss = 0.0684
Iteration 20, loss = 0.0135
Iteration 40, loss = 0.0425
Iteration 60, loss = 0.0418
Iteration 80, loss = 0.0762
--- Epoch 11 / 25 - 11 epochs total
Iteration 0, loss = 0.0578
Iteration 20, loss = 0.1219
Iteration 40, loss = 0.0485
Iteration 60, loss = 0.0437
Iteration 80, loss = 0.0725
--- Epoch 12 / 25 - 12 epochs total
Iteration 0, loss = 0.1021
Iteration 20, loss = 0.0815
Iteration 40, loss = 0.0393
Iteration 60, loss = 0.0431
Iteration 80, loss = 0.0653
--- Epoch 13 / 25 - 13 epochs total
Iteration 0, loss = 0.0581
Iteration 20, loss = 0.1159
Iteration 40, loss = 0.0406
Iteration 60, loss = 0.0558
Iteration 80, loss = 0.0403
--- Epoch 14 / 25 - 14 epochs total
Iteration 0, loss = 0.0160
Iteration 20, loss = 0.1339
Iteration 40, loss = 0.0924
Iteration 60, loss = 0.0632
Iteration 80, loss = 0.0237
--- Epoch 15 / 25 - 15 epochs total
Iteration 0, loss = 0.0275
Iteration 20, loss = 0.0514
Iteration 40, loss = 0.0580
Iteration 60, loss = 0.0503
Iteration 80, loss = 0.0365
--- Epoch 16 / 25 - 16 epochs total
Iteration 0, loss = 0.0645
Iteration 20, loss = 0.0301
Iteration 40, loss = 0.0662
Iteration 60, loss = 0.0634
Iteration 80, loss = 0.0356
--- Epoch 17 / 25 - 17 epochs total
Iteration 0, loss = 0.0517
Iteration 20, loss = 0.0566
Iteration 40, loss = 0.0724
Iteration 60, loss = 0.0264
Iteration 80, loss = 0.0671
--- Epoch 18 / 25 - 18 epochs total
Iteration 0, loss = 0.0507
Iteration 20, loss = 0.0167
Iteration 40, loss = 0.0526
Iteration 60, loss = 0.0588
Iteration 80, loss = 0.0459
--- Epoch 19 / 25 - 19 epochs total
Iteration 0, loss = 0.0549
Iteration 20, loss = 0.0494
Iteration 40, loss = 0.0355
Iteration 60, loss = 0.0258
Iteration 80, loss = 0.0681
--- Epoch 20 / 25 - 20 epochs total
Iteration 0, loss = 0.0099
Iteration 20, loss = 0.0552
Iteration 40, loss = 0.0585
Iteration 60, loss = 0.0344
Iteration 80, loss = 0.0662
--- Epoch 21 / 25 - 21 epochs total
Iteration 0, loss = 0.0338
Iteration 20, loss = 0.0382
Iteration 40, loss = 0.0445
Iteration 60, loss = 0.0495
Iteration 80, loss = 0.1125
--- Epoch 22 / 25 - 22 epochs total
Iteration 0, loss = 0.0905
Iteration 20, loss = 0.0246
Iteration 40, loss = 0.0579
Iteration 60, loss = 0.0920
Iteration 80, loss = 0.0637
--- Epoch 23 / 25 - 23 epochs total
Iteration 0, loss = 0.0438
Iteration 20, loss = 0.0504
Iteration 40, loss = 0.0171
Iteration 60, loss = 0.0454
Iteration 80, loss = 0.0272
--- Epoch 24 / 25 - 24 epochs total
Iteration 0, loss = 0.0121
Iteration 20, loss = 0.0197
Iteration 40, loss = 0.0689
Iteration 60, loss = 0.0461
Iteration 80, loss = 0.0629
--- Epoch 25 / 25 - 25 epochs total
Iteration 0, loss = 0.0734
Iteration 20, loss = 0.0574
Iteration 40, loss = 0.0919
Iteration 60, loss = 0.0485
Iteration 80, loss = 0.0501
In [145]:
def testModel(model, n=10, x_test=data["X_test"], y_test=data["y_test"], criterion=nn.MSELoss()):
    """
    Show `n` random test samples next to the model's prediction and the target.

    Draws an `n` x 3 grid: the input image, the prediction (titled with its
    loss against the target) and the target image.

    Inputs:
    - model: A PyTorch Module; it is called on one sample of `x_test` at a
      time and is switched to evaluation mode (and left there).
    - n: (Optional) Number of samples to show, drawn with replacement.
    - x_test: (Optional) NumPy array of channels-first input images.
    - y_test: (Optional) NumPy array of target images aligned with `x_test`.
    - criterion: (Optional) Callable `criterion(prediction, target)` that
      returns a scalar loss tensor.

    The default arrays are bound when this function is defined.

    Returns: Nothing; the figure is drawn as a side effect.
    """
    model.eval()

    # squeeze=False keeps `axs` two-dimensional, so n=1 works as well.
    fig, axs = plt.subplots(n, 3, squeeze=False)
    fig.set_size_inches(10, 25)
    idx = np.random.choice(x_test.shape[0], n)

    # Pure inference: no autograd graph is needed.
    with torch.no_grad():
        for i in range(n):
            x_sample = x_test[idx[i]]
            y_sample = y_test[idx[i]]
            x_data = torch.from_numpy(x_sample).to(device=device, dtype=dtype)
            y_data = torch.from_numpy(y_sample).to(device=device, dtype=dtype)

            # Give the flat prediction the target's shape instead of
            # assuming 3 x 32 x 32.
            predicted = model(x_data).view(y_data.shape)
            loss = criterion(predicted, y_data)

            # A CUDA tensor has to be copied to the CPU before .numpy().
            # imshow clips float RGB data to [0, 1] anyway; clipping here
            # gives the same picture without one warning per image.
            predicted_image = np.clip(predicted.detach().cpu().numpy(), 0.0, 1.0)

            axs[i, 0].title.set_text('X data')
            axs[i, 1].title.set_text('Loss=' + "{:.9f}".format(loss.item()))
            axs[i, 2].title.set_text('Actual')

            # imshow wants channels last: (C, H, W) -> (H, W, C).
            axs[i, 0].imshow(x_sample.transpose(1, 2, 0))
            axs[i, 1].imshow(predicted_image.transpose(1, 2, 0))
            axs[i, 2].imshow(y_sample.transpose(1, 2, 0))

    # Lay out once the titles and images exist, so they are taken into account.
    fig.tight_layout()
          
In [170]:
# Visual check of the fully connected baseline on random test images.
testModel(model1)
Clipping input data to the valid range for imshow with RGB data ([0..1] for floats or [0..255] for integers).
Clipping input data to the valid range for imshow with RGB data ([0..1] for floats or [0..255] for integers).
Clipping input data to the valid range for imshow with RGB data ([0..1] for floats or [0..255] for integers).
Clipping input data to the valid range for imshow with RGB data ([0..1] for floats or [0..255] for integers).
In [22]:
class BasicConvNet(nn.Module):
    """Three unpadded 3x3 convolutions with ReLU, followed by one linear
    layer that produces a flat 32 * 32 * 3 output."""

    def __init__(self):
        super().__init__()
        self.epochsTrained = 0

        # Without padding, each 3x3 convolution trims 2 pixels per spatial
        # axis, so a 32x32 input shrinks to 30, 28 and finally 26.
        self.conv1 = nn.Conv2d(in_channels=3, out_channels=24, kernel_size=3, stride=1, padding=0)
        self.conv2 = nn.Conv2d(in_channels=24, out_channels=24, kernel_size=3, stride=1, padding=0)
        self.conv3 = nn.Conv2d(in_channels=24, out_channels=12, kernel_size=3, stride=1, padding=0)
        # 8112 = 12 channels * 26 * 26 remaining pixels.
        self.fc = nn.Linear(8112, 32 * 32 * 3)

    def forward(self, x):
        """Run one unbatched image through the network and return flat scores."""
        features = x.unsqueeze(0)  # add a batch axis of size 1
        for conv in (self.conv1, self.conv2, self.conv3):
            features = F.relu(conv(features))
        return self.fc(features.view(-1))
In [172]:
# Train the convolutional baseline with the same learning rate, optimizer
# type and epoch count as model1.
learning_rate = 1e-2
model2 = BasicConvNet()
# `optimizer` is rebound here and from now on refers to model2's parameters.
optimizer = optim.SGD(model2.parameters(), lr=learning_rate)

# MSELoss is passed explicitly; it is also train()'s default criterion.
train(model2, optimizer, epochs=25, criterion=nn.MSELoss())
--- Epoch 1 / 25 - 1 epochs total
Iteration 0, loss = 0.3250
Iteration 20, loss = 0.1401
Iteration 40, loss = 0.2926
Iteration 60, loss = 0.3218
Iteration 80, loss = 0.2827
--- Epoch 2 / 25 - 2 epochs total
Iteration 0, loss = 0.3426
Iteration 20, loss = 0.1222
Iteration 40, loss = 0.5539
Iteration 60, loss = 0.1707
Iteration 80, loss = 0.3535
--- Epoch 3 / 25 - 3 epochs total
Iteration 0, loss = 0.2681
Iteration 20, loss = 0.2246
Iteration 40, loss = 0.3098
Iteration 60, loss = 0.1848
Iteration 80, loss = 0.3872
--- Epoch 4 / 25 - 4 epochs total
Iteration 0, loss = 0.0420
Iteration 20, loss = 0.2622
Iteration 40, loss = 0.1603
Iteration 60, loss = 0.0840
Iteration 80, loss = 0.1690
--- Epoch 5 / 25 - 5 epochs total
Iteration 0, loss = 0.0431
Iteration 20, loss = 0.1285
Iteration 40, loss = 0.0655
Iteration 60, loss = 0.0661
Iteration 80, loss = 0.0665
--- Epoch 6 / 25 - 6 epochs total
Iteration 0, loss = 0.0418
Iteration 20, loss = 0.0540
Iteration 40, loss = 0.1009
Iteration 60, loss = 0.0712
Iteration 80, loss = 0.0702
--- Epoch 7 / 25 - 7 epochs total
Iteration 0, loss = 0.0361
Iteration 20, loss = 0.0178
Iteration 40, loss = 0.0333
Iteration 60, loss = 0.0257
Iteration 80, loss = 0.0402
--- Epoch 8 / 25 - 8 epochs total
Iteration 0, loss = 0.0361
Iteration 20, loss = 0.0587
Iteration 40, loss = 0.0777
Iteration 60, loss = 0.0482
Iteration 80, loss = 0.0690
--- Epoch 9 / 25 - 9 epochs total
Iteration 0, loss = 0.0463
Iteration 20, loss = 0.0761
Iteration 40, loss = 0.0588
Iteration 60, loss = 0.0356
Iteration 80, loss = 0.0691
--- Epoch 10 / 25 - 10 epochs total
Iteration 0, loss = 0.0794
Iteration 20, loss = 0.0073
Iteration 40, loss = 0.0387
Iteration 60, loss = 0.0116
Iteration 80, loss = 0.0259
--- Epoch 11 / 25 - 11 epochs total
Iteration 0, loss = 0.0665
Iteration 20, loss = 0.0568
Iteration 40, loss = 0.0544
Iteration 60, loss = 0.0923
Iteration 80, loss = 0.0191
--- Epoch 12 / 25 - 12 epochs total
Iteration 0, loss = 0.0189
Iteration 20, loss = 0.0431
Iteration 40, loss = 0.0440
Iteration 60, loss = 0.0827
Iteration 80, loss = 0.0411
--- Epoch 13 / 25 - 13 epochs total
Iteration 0, loss = 0.0408
Iteration 20, loss = 0.0383
Iteration 40, loss = 0.0811
Iteration 60, loss = 0.0319
Iteration 80, loss = 0.0371
--- Epoch 14 / 25 - 14 epochs total
Iteration 0, loss = 0.0675
Iteration 20, loss = 0.0269
Iteration 40, loss = 0.0464
Iteration 60, loss = 0.0359
Iteration 80, loss = 0.0777
--- Epoch 15 / 25 - 15 epochs total
Iteration 0, loss = 0.0494
Iteration 20, loss = 0.0465
Iteration 40, loss = 0.0550
Iteration 60, loss = 0.0470
Iteration 80, loss = 0.0217
--- Epoch 16 / 25 - 16 epochs total
Iteration 0, loss = 0.0241
Iteration 20, loss = 0.0531
Iteration 40, loss = 0.0545
Iteration 60, loss = 0.0363
Iteration 80, loss = 0.0274
--- Epoch 17 / 25 - 17 epochs total
Iteration 0, loss = 0.0668
Iteration 20, loss = 0.0375
Iteration 40, loss = 0.0313
Iteration 60, loss = 0.0566
Iteration 80, loss = 0.0603
--- Epoch 18 / 25 - 18 epochs total
Iteration 0, loss = 0.0432
Iteration 20, loss = 0.0534
Iteration 40, loss = 0.0431
Iteration 60, loss = 0.0287
Iteration 80, loss = 0.0745
--- Epoch 19 / 25 - 19 epochs total
Iteration 0, loss = 0.0599
Iteration 20, loss = 0.0335
Iteration 40, loss = 0.0950
Iteration 60, loss = 0.0310
Iteration 80, loss = 0.0671
--- Epoch 20 / 25 - 20 epochs total
Iteration 0, loss = 0.0641
Iteration 20, loss = 0.0458
Iteration 40, loss = 0.0320
Iteration 60, loss = 0.0294
Iteration 80, loss = 0.0455
--- Epoch 21 / 25 - 21 epochs total
Iteration 0, loss = 0.0222
Iteration 20, loss = 0.0361
Iteration 40, loss = 0.0441
Iteration 60, loss = 0.0221
Iteration 80, loss = 0.0387
--- Epoch 22 / 25 - 22 epochs total
Iteration 0, loss = 0.0297
Iteration 20, loss = 0.0431
Iteration 40, loss = 0.0498
Iteration 60, loss = 0.0388
Iteration 80, loss = 0.0436
--- Epoch 23 / 25 - 23 epochs total
Iteration 0, loss = 0.0531
Iteration 20, loss = 0.0676
Iteration 40, loss = 0.0386
Iteration 60, loss = 0.0482
Iteration 80, loss = 0.0523
--- Epoch 24 / 25 - 24 epochs total
Iteration 0, loss = 0.0627
Iteration 20, loss = 0.0386
Iteration 40, loss = 0.0173
Iteration 60, loss = 0.0525
Iteration 80, loss = 0.0631
--- Epoch 25 / 25 - 25 epochs total
Iteration 0, loss = 0.0793
Iteration 20, loss = 0.0748
Iteration 40, loss = 0.0250
Iteration 60, loss = 0.0448
Iteration 80, loss = 0.0378
In [173]:
# Visual check of the convolutional baseline on random test images.
testModel(model2)
Clipping input data to the valid range for imshow with RGB data ([0..1] for floats or [0..255] for integers).
In [150]:
class ConvNet(nn.Module):
    """
    Convolutional image-to-image model with a skip connection from the input.

    Three unpadded convolutions (5x5, 4x4 and 3x3), each followed by ReLU and
    batch normalization, produce features that are flattened, concatenated
    with the flattened input and mapped by one linear layer to a flat
    32 * 32 * 3 output.
    """

    def __init__(self):
        super().__init__()
        self.epochsTrained = 0

        # Every convolution gets its own BatchNorm module so that the running
        # statistics and affine parameters of different layers are never
        # mixed. The attribute names are historical and do not match the
        # channel counts: `batchnorm48*` normalise 24 channels and
        # `batchnorm24` normalises 12.
        self.batchnorm48 = nn.BatchNorm2d(24)    # after conv1
        self.batchnorm48_2 = nn.BatchNorm2d(24)  # after conv2
        self.batchnorm24 = nn.BatchNorm2d(12)    # after conv3

        # Without padding a 32x32 input shrinks to 28 (5x5), 25 (4x4) and
        # 23 (3x3) pixels per side.
        self.conv1 = nn.Conv2d(3, 24, kernel_size=5, stride=1, padding=0)   # 24 5x5 filters
        self.conv2 = nn.Conv2d(24, 24, kernel_size=4, stride=1, padding=0)  # 24 4x4 filters
        self.conv3 = nn.Conv2d(24, 12, kernel_size=3, stride=1, padding=0)  # 12 3x3 filters
        # 9420 = 12 * 23 * 23 conv features + 3 * 32 * 32 raw input values.
        self.fc = nn.Linear(9420, 32 * 32 * 3)

    def forward(self, x):
        """Run one unbatched (3, 32, 32) image through the network.

        Returns the flat output of the final linear layer.
        """
        x2 = x.unsqueeze(0)  # add a batch axis of size 1
        scores = self.batchnorm48(F.relu(self.conv1(x2)))
        scores = self.batchnorm48_2(F.relu(self.conv2(scores)))
        scores = self.batchnorm24(F.relu(self.conv3(scores)))

        # Skip connection: the linear layer sees the conv features and the
        # raw input side by side.
        with_x = torch.cat((scores.view(-1), x.view(-1)), 0)
        return self.fc(with_x)
In [152]:
# Train the batch-normalised ConvNet; it gets 50 epochs instead of the 25
# used for the two baselines.
learning_rate = 1e-2
model3 = ConvNet()
# `optimizer` is rebound here and from now on refers to model3's parameters.
optimizer = optim.SGD(model3.parameters(), lr=learning_rate)

# No criterion is given, so train() falls back to its default MSELoss.
train(model3, optimizer, epochs=50)
--- Epoch 1 / 50 - 1 epochs total
Iteration 0, loss = 0.4640
Iteration 20, loss = 0.6072
Iteration 40, loss = 0.3148
Iteration 60, loss = 0.4069
Iteration 80, loss = 0.4691
--- Epoch 2 / 50 - 2 epochs total
Iteration 0, loss = 0.3967
Iteration 20, loss = 0.2838
Iteration 40, loss = 0.3281
Iteration 60, loss = 0.2043
Iteration 80, loss = 0.2292
--- Epoch 3 / 50 - 3 epochs total
Iteration 0, loss = 0.1746
Iteration 20, loss = 0.2492
Iteration 40, loss = 0.3015
Iteration 60, loss = 0.2115
Iteration 80, loss = 0.1473
--- Epoch 4 / 50 - 4 epochs total
Iteration 0, loss = 0.2002
Iteration 20, loss = 0.1324
Iteration 40, loss = 0.1655
Iteration 60, loss = 0.1047
Iteration 80, loss = 0.1279
--- Epoch 5 / 50 - 5 epochs total
Iteration 0, loss = 0.0658
Iteration 20, loss = 0.1138
Iteration 40, loss = 0.0834
Iteration 60, loss = 0.0691
Iteration 80, loss = 0.1292
--- Epoch 6 / 50 - 6 epochs total
Iteration 0, loss = 0.0616
Iteration 20, loss = 0.0694
Iteration 40, loss = 0.0584
Iteration 60, loss = 0.0816
Iteration 80, loss = 0.0577
--- Epoch 7 / 50 - 7 epochs total
Iteration 0, loss = 0.1324
Iteration 20, loss = 0.0863
Iteration 40, loss = 0.0708
Iteration 60, loss = 0.0754
Iteration 80, loss = 0.0538
--- Epoch 8 / 50 - 8 epochs total
Iteration 0, loss = 0.0802
Iteration 20, loss = 0.0406
Iteration 40, loss = 0.1031
Iteration 60, loss = 0.0588
Iteration 80, loss = 0.0686
--- Epoch 9 / 50 - 9 epochs total
Iteration 0, loss = 0.1652
Iteration 20, loss = 0.0631
Iteration 40, loss = 0.0613
Iteration 60, loss = 0.0669
Iteration 80, loss = 0.0380
--- Epoch 10 / 50 - 10 epochs total
Iteration 0, loss = 0.0784
Iteration 20, loss = 0.0547
Iteration 40, loss = 0.0615
Iteration 60, loss = 0.0810
Iteration 80, loss = 0.0512
--- Epoch 11 / 50 - 11 epochs total
Iteration 0, loss = 0.0210
Iteration 20, loss = 0.0955
Iteration 40, loss = 0.0307
Iteration 60, loss = 0.0660
Iteration 80, loss = 0.0666
--- Epoch 12 / 50 - 12 epochs total
Iteration 0, loss = 0.0620
Iteration 20, loss = 0.0627
Iteration 40, loss = 0.0634
Iteration 60, loss = 0.0754
Iteration 80, loss = 0.0725
--- Epoch 13 / 50 - 13 epochs total
Iteration 0, loss = 0.0478
Iteration 20, loss = 0.0635
Iteration 40, loss = 0.0587
Iteration 60, loss = 0.0401
Iteration 80, loss = 0.0480
--- Epoch 14 / 50 - 14 epochs total
Iteration 0, loss = 0.0413
Iteration 20, loss = 0.0322
Iteration 40, loss = 0.0501
Iteration 60, loss = 0.0378
Iteration 80, loss = 0.0433
--- Epoch 15 / 50 - 15 epochs total
Iteration 0, loss = 0.0587
Iteration 20, loss = 0.0390
Iteration 40, loss = 0.0298
Iteration 60, loss = 0.0265
Iteration 80, loss = 0.0504
--- Epoch 16 / 50 - 16 epochs total
Iteration 0, loss = 0.0631
Iteration 20, loss = 0.0567
Iteration 40, loss = 0.0511
Iteration 60, loss = 0.0489
Iteration 80, loss = 0.0436
--- Epoch 17 / 50 - 17 epochs total
Iteration 0, loss = 0.0723
Iteration 20, loss = 0.0434
Iteration 40, loss = 0.0835
Iteration 60, loss = 0.0518
Iteration 80, loss = 0.1040
--- Epoch 18 / 50 - 18 epochs total
Iteration 0, loss = 0.0448
Iteration 20, loss = 0.0658
Iteration 40, loss = 0.0714
Iteration 60, loss = 0.0629
Iteration 80, loss = 0.0710
--- Epoch 19 / 50 - 19 epochs total
Iteration 0, loss = 0.0361
Iteration 20, loss = 0.0423
Iteration 40, loss = 0.0460
Iteration 60, loss = 0.0197
Iteration 80, loss = 0.0468
--- Epoch 20 / 50 - 20 epochs total
Iteration 0, loss = 0.0461
Iteration 20, loss = 0.0503
Iteration 40, loss = 0.0350
Iteration 60, loss = 0.0665
Iteration 80, loss = 0.0705
--- Epoch 21 / 50 - 21 epochs total
Iteration 0, loss = 0.0350
Iteration 20, loss = 0.0433
Iteration 40, loss = 0.0592
Iteration 60, loss = 0.0395
Iteration 80, loss = 0.0410
--- Epoch 22 / 50 - 22 epochs total
Iteration 0, loss = 0.0369
Iteration 20, loss = 0.0385
Iteration 40, loss = 0.0337
Iteration 60, loss = 0.0424
Iteration 80, loss = 0.0314
--- Epoch 23 / 50 - 23 epochs total
Iteration 0, loss = 0.0529
Iteration 20, loss = 0.0471
Iteration 40, loss = 0.0548
Iteration 60, loss = 0.0590
Iteration 80, loss = 0.0609
--- Epoch 24 / 50 - 24 epochs total
Iteration 0, loss = 0.0198
Iteration 20, loss = 0.0695
Iteration 40, loss = 0.0591
Iteration 60, loss = 0.0346
Iteration 80, loss = 0.0626
--- Epoch 25 / 50 - 25 epochs total
Iteration 0, loss = 0.0495
Iteration 20, loss = 0.0444
Iteration 40, loss = 0.0306
Iteration 60, loss = 0.0263
Iteration 80, loss = 0.0384
--- Epoch 26 / 50 - 26 epochs total
Iteration 0, loss = 0.0502
Iteration 20, loss = 0.0604
Iteration 40, loss = 0.0319
Iteration 60, loss = 0.0243
Iteration 80, loss = 0.0575
--- Epoch 27 / 50 - 27 epochs total
Iteration 0, loss = 0.0354
Iteration 20, loss = 0.0336
Iteration 40, loss = 0.0672
Iteration 60, loss = 0.0593
Iteration 80, loss = 0.0332
--- Epoch 28 / 50 - 28 epochs total
Iteration 0, loss = 0.0344
Iteration 20, loss = 0.0280
Iteration 40, loss = 0.0215
Iteration 60, loss = 0.0270
Iteration 80, loss = 0.0566
--- Epoch 29 / 50 - 29 epochs total
Iteration 0, loss = 0.0398
Iteration 20, loss = 0.0439
Iteration 40, loss = 0.0233
Iteration 60, loss = 0.0339
Iteration 80, loss = 0.0299
--- Epoch 30 / 50 - 30 epochs total
Iteration 0, loss = 0.0281
Iteration 20, loss = 0.0432
Iteration 40, loss = 0.0421
Iteration 60, loss = 0.0353
Iteration 80, loss = 0.0378
--- Epoch 31 / 50 - 31 epochs total
Iteration 0, loss = 0.0339
Iteration 20, loss = 0.0268
Iteration 40, loss = 0.0414
Iteration 60, loss = 0.0233
Iteration 80, loss = 0.0343
--- Epoch 32 / 50 - 32 epochs total
Iteration 0, loss = 0.0312
Iteration 20, loss = 0.0274
Iteration 40, loss = 0.0481
Iteration 60, loss = 0.0209
Iteration 80, loss = 0.0338
--- Epoch 33 / 50 - 33 epochs total
Iteration 0, loss = 0.0281
Iteration 20, loss = 0.0562
Iteration 40, loss = 0.0288
Iteration 60, loss = 0.0451
Iteration 80, loss = 0.0420
--- Epoch 34 / 50 - 34 epochs total
Iteration 0, loss = 0.0306
Iteration 20, loss = 0.0394
Iteration 40, loss = 0.0407
Iteration 60, loss = 0.0206
Iteration 80, loss = 0.0593
--- Epoch 35 / 50 - 35 epochs total
Iteration 0, loss = 0.0292
Iteration 20, loss = 0.0303
Iteration 40, loss = 0.0340
Iteration 60, loss = 0.0511
Iteration 80, loss = 0.0219
--- Epoch 36 / 50 - 36 epochs total
Iteration 0, loss = 0.0402
Iteration 20, loss = 0.0206
Iteration 40, loss = 0.0390
Iteration 60, loss = 0.0335
Iteration 80, loss = 0.0423
--- Epoch 37 / 50 - 37 epochs total
Iteration 0, loss = 0.0245
Iteration 20, loss = 0.0332
Iteration 40, loss = 0.0388
Iteration 60, loss = 0.0289
Iteration 80, loss = 0.0292
--- Epoch 38 / 50 - 38 epochs total
Iteration 0, loss = 0.0372
Iteration 20, loss = 0.0211
Iteration 40, loss = 0.0418
Iteration 60, loss = 0.0306
Iteration 80, loss = 0.0417
--- Epoch 39 / 50 - 39 epochs total
Iteration 0, loss = 0.0335
Iteration 20, loss = 0.1187
Iteration 40, loss = 0.0342
Iteration 60, loss = 0.0413
Iteration 80, loss = 0.0367
--- Epoch 40 / 50 - 40 epochs total
Iteration 0, loss = 0.0327
Iteration 20, loss = 0.0363
Iteration 40, loss = 0.0793
Iteration 60, loss = 0.0334
Iteration 80, loss = 0.0324
--- Epoch 41 / 50 - 41 epochs total
Iteration 0, loss = 0.0254
Iteration 20, loss = 0.0336
Iteration 40, loss = 0.0627
Iteration 60, loss = 0.0296
Iteration 80, loss = 0.0430
--- Epoch 42 / 50 - 42 epochs total
Iteration 0, loss = 0.0211
Iteration 20, loss = 0.0271
Iteration 40, loss = 0.0326
Iteration 60, loss = 0.0313
Iteration 80, loss = 0.0233
--- Epoch 43 / 50 - 43 epochs total
Iteration 0, loss = 0.0271
Iteration 20, loss = 0.0390
Iteration 40, loss = 0.0335
Iteration 60, loss = 0.0272
Iteration 80, loss = 0.0192
--- Epoch 44 / 50 - 44 epochs total
Iteration 0, loss = 0.0207
Iteration 20, loss = 0.0490
Iteration 40, loss = 0.0306
Iteration 60, loss = 0.0333
Iteration 80, loss = 0.0384
--- Epoch 45 / 50 - 45 epochs total
Iteration 0, loss = 0.0321
Iteration 20, loss = 0.0427
Iteration 40, loss = 0.0443
Iteration 60, loss = 0.0243
Iteration 80, loss = 0.0163
--- Epoch 46 / 50 - 46 epochs total
Iteration 0, loss = 0.0286
Iteration 20, loss = 0.0669
Iteration 40, loss = 0.0432
Iteration 60, loss = 0.0391
Iteration 80, loss = 0.0431
--- Epoch 47 / 50 - 47 epochs total
Iteration 0, loss = 0.0348
Iteration 20, loss = 0.0540
Iteration 40, loss = 0.0531
Iteration 60, loss = 0.0498
Iteration 80, loss = 0.0196
--- Epoch 48 / 50 - 48 epochs total
Iteration 0, loss = 0.0172
Iteration 20, loss = 0.0176
Iteration 40, loss = 0.0553
Iteration 60, loss = 0.0299
Iteration 80, loss = 0.0244
--- Epoch 49 / 50 - 49 epochs total
Iteration 0, loss = 0.0242
Iteration 20, loss = 0.0572
Iteration 40, loss = 0.0327
Iteration 60, loss = 0.0355
Iteration 80, loss = 0.0435
--- Epoch 50 / 50 - 50 epochs total
Iteration 0, loss = 0.0332
Iteration 20, loss = 0.0262
Iteration 40, loss = 0.0292
Iteration 60, loss = 0.0533
Iteration 80, loss = 0.0221
In [153]:
# Visual check of the ConvNet trained with plain MSE on random test images.
testModel(model3)
Clipping input data to the valid range for imshow with RGB data ([0..1] for floats or [0..255] for integers).
Clipping input data to the valid range for imshow with RGB data ([0..1] for floats or [0..255] for integers).
Clipping input data to the valid range for imshow with RGB data ([0..1] for floats or [0..255] for integers).
Clipping input data to the valid range for imshow with RGB data ([0..1] for floats or [0..255] for integers).
Clipping input data to the valid range for imshow with RGB data ([0..1] for floats or [0..255] for integers).
Clipping input data to the valid range for imshow with RGB data ([0..1] for floats or [0..255] for integers).
Clipping input data to the valid range for imshow with RGB data ([0..1] for floats or [0..255] for integers).
Clipping input data to the valid range for imshow with RGB data ([0..1] for floats or [0..255] for integers).
Clipping input data to the valid range for imshow with RGB data ([0..1] for floats or [0..255] for integers).
Clipping input data to the valid range for imshow with RGB data ([0..1] for floats or [0..255] for integers).
In [62]:
def detectEdges(image, threshold=0.15):
    """
    Return a binary edge map of `image`, copied into its first three channels.

    Channel 0 of `image` is convolved with a 3x3 kernel (8 at the centre, -1
    around it, zero padding of 1) and the response is binarised: pixels whose
    response exceeds `threshold` become 1, every other pixel becomes 0.

    Inputs:
    - image: Tensor of shape (C, H, W); only channel 0 is read.
    - threshold: (Optional) Cut-off applied to the filter response.

    Returns: A tensor with the shape of `image` that holds only 0s and 1s.
    It is allocated with `torch.zeros` defaults (default dtype, CPU) whatever
    device `image` lives on, so callers can pass it straight to `.numpy()`.
    The hard threshold is not differentiable, so no gradient flows back to
    `image` through the result.
    """
    # Build the kernel on the input's own device/dtype so the convolution
    # works for any tensor, not only those matching the notebook globals.
    kernel = torch.tensor(
        [[-1, -1, -1], [-1, 8, -1], [-1, -1, -1]],
        device=image.device, dtype=image.dtype,
    ).view(1, 1, 3, 3)

    height, width = image.shape[-2:]
    first_channel = image[0].reshape(1, 1, height, width)
    response = F.conv2d(first_channel, kernel, padding=1)[0, 0]

    # A single comparison yields a strictly binary map; a response sitting
    # exactly on the threshold counts as "no edge".
    binary = response > threshold

    ret = torch.zeros(image.shape)
    # Broadcast the (H, W) map over the first three channels.
    ret[:3] = binary.to(device=ret.device, dtype=ret.dtype)
    return ret

Test edge detection

In [63]:
n = 10
idx = np.random.choice(range(data["X_test"].shape[0]), n)

fig, axs = plt.subplots(n, 3)
fig.set_size_inches(10, 25)

# Column headers go on the first row only.
for header_ax, header in zip(axs[0], ('X data', 'Edges', 'Actual')):
    header_ax.title.set_text(header)

for (ax_input, ax_edges, ax_target), sample in zip(axs, idx):
    x_data = data["X_test"][sample]
    y_data = data["y_test"][sample]

    # The edge map is computed from the colour target (detectEdges reads
    # only its first channel), not from the grayscale input.
    edge_map = detectEdges(torch.from_numpy(y_data).to(device=device, dtype=dtype))

    # imshow wants channels last: (C, H, W) -> (H, W, C).
    ax_input.imshow(x_data.transpose(1, 2, 0))
    ax_edges.imshow(edge_map.detach().numpy().transpose(1, 2, 0))
    ax_target.imshow(y_data.transpose(1, 2, 0))

Build custom loss functions that use the difference between adjacent pixels to smooth the results and edge detection to keep the image structure. (The edge-detection loss didn't work well in any of my tests, so it is not widely used later on.)

In [337]:
def custom_loss(output, target):
    """
    Mean squared error plus a smoothness penalty on the predicted image.

    Inputs:
    - output: Predicted image; any tensor that can be viewed as (3, 32, 32).
    - target: Ground-truth image in the same layout.

    Returns: A scalar tensor equal to
      0.8 * mean squared error between output and target
      + 0.1 * mean squared difference of horizontally adjacent output pixels
      + 0.1 * mean squared difference of vertically adjacent output pixels.
    """
    output = output.view(3, 32, 32)
    target = target.view(3, 32, 32)

    # Overall mean squared error
    color_loss = torch.mean((output - target) ** 2)

    # The layout is (channel, row, column): neighbours along the last axis
    # are horizontal, neighbours along the middle axis are vertical. Axis 0
    # is the colour channel and must not be differenced, because that would
    # penalise colour itself and pull the prediction towards gray.
    horizontal_loss = torch.mean((output[:, :, 1:] - output[:, :, :-1]) ** 2)
    vertical_loss = torch.mean((output[:, 1:, :] - output[:, :-1, :]) ** 2)

    # Both smoothness directions get the same weight; the weights sum to 1.
    return color_loss * 0.8 + horizontal_loss * 0.1 + vertical_loss * 0.1
In [225]:
def custom_loss_edges(output, target):
    """Colour MSE + spatial smoothness + edge-map mismatch for one 3x32x32 image.

    Args:
        output: predicted image; any tensor holding 3 * 32 * 32 values.
        target: reference image; any tensor holding 3 * 32 * 32 values.

    Returns:
        Scalar tensor equal to
        ``0.6 * colour_mse + 0.1 * horizontal + 0.1 * vertical + 0.2 * edge``,
        where ``edge`` is the mean squared difference between the
        ``detectEdges`` maps of the two images.
    """
    # Axis 0 is the colour channel; axes 1 and 2 are the spatial axes.
    output = output.reshape(3, 32, 32)
    target = target.reshape(3, 32, 32)

    # Compare the edge maps of prediction and reference
    output_edges = detectEdges(output)
    target_edges = detectEdges(target)
    edge_loss = torch.mean((output_edges - target_edges) ** 2)

    color_loss = torch.mean((output - target) ** 2)

    # Smoothness is measured between adjacent *pixels*, so only the two spatial
    # axes are differenced. Differencing axis 0 would instead penalise the
    # difference between colour channels and push the prediction towards gray.
    horizontal_loss = torch.mean((output[:, :, 1:] - output[:, :, :-1]) ** 2)
    vertical_loss = torch.mean((output[:, 1:, :] - output[:, :-1, :]) ** 2)

    loss = color_loss * 0.6 + horizontal_loss * 0.1 + vertical_loss * 0.1 + edge_loss * 0.2

    return loss
In [ ]:
# Experiment setup: a freshly constructed ConvNet optimised with SGD
# (only the learning rate is passed to the optimizer).
learning_rate = 1e-2
model4 = ConvNet()
# `optimizer` is a notebook-level name that each experiment's setup cell rebinds.
optimizer = optim.SGD(model4.parameters(), lr=learning_rate)
In [452]:
# Train model4 with custom_loss. The recorded run below was stopped by hand
# (KeyboardInterrupt) during epoch 77 of the requested 300.
train(model4, optimizer, epochs=300, criterion=custom_loss)
--- Epoch 1 / 300
Iteration 0, loss = 0.0092
Iteration 20, loss = 0.0071
Iteration 40, loss = 0.0094
Iteration 60, loss = 0.0125
Iteration 80, loss = 0.0049
--- Epoch 2 / 300
Iteration 0, loss = 0.0107
Iteration 20, loss = 0.0072
Iteration 40, loss = 0.0085
Iteration 60, loss = 0.0063
Iteration 80, loss = 0.0119
--- Epoch 3 / 300
Iteration 0, loss = 0.0120
Iteration 20, loss = 0.0098
Iteration 40, loss = 0.0176
Iteration 60, loss = 0.0105
Iteration 80, loss = 0.0149
--- Epoch 4 / 300
Iteration 0, loss = 0.0054
Iteration 20, loss = 0.0100
Iteration 40, loss = 0.0185
Iteration 60, loss = 0.0155
Iteration 80, loss = 0.0162
--- Epoch 5 / 300
Iteration 0, loss = 0.0103
Iteration 20, loss = 0.0117
Iteration 40, loss = 0.0125
Iteration 60, loss = 0.0195
Iteration 80, loss = 0.0104
--- Epoch 6 / 300
Iteration 0, loss = 0.0161
Iteration 20, loss = 0.0251
Iteration 40, loss = 0.0237
Iteration 60, loss = 0.0107
Iteration 80, loss = 0.0178
--- Epoch 7 / 300
Iteration 0, loss = 0.0089
Iteration 20, loss = 0.0097
Iteration 40, loss = 0.0109
Iteration 60, loss = 0.0086
Iteration 80, loss = 0.0073
--- Epoch 8 / 300
Iteration 0, loss = 0.0141
Iteration 20, loss = 0.0271
Iteration 40, loss = 0.0117
Iteration 60, loss = 0.0107
Iteration 80, loss = 0.0091
--- Epoch 9 / 300
Iteration 0, loss = 0.0069
Iteration 20, loss = 0.0149
Iteration 40, loss = 0.0130
Iteration 60, loss = 0.0105
Iteration 80, loss = 0.0136
--- Epoch 10 / 300
Iteration 0, loss = 0.0094
Iteration 20, loss = 0.0150
Iteration 40, loss = 0.0079
Iteration 60, loss = 0.0126
Iteration 80, loss = 0.0070
--- Epoch 11 / 300
Iteration 0, loss = 0.0123
Iteration 20, loss = 0.0145
Iteration 40, loss = 0.0092
Iteration 60, loss = 0.0098
Iteration 80, loss = 0.0216
--- Epoch 12 / 300
Iteration 0, loss = 0.0196
Iteration 20, loss = 0.0195
Iteration 40, loss = 0.0116
Iteration 60, loss = 0.0117
Iteration 80, loss = 0.0098
--- Epoch 13 / 300
Iteration 0, loss = 0.0093
Iteration 20, loss = 0.0181
Iteration 40, loss = 0.0167
Iteration 60, loss = 0.0199
Iteration 80, loss = 0.0089
--- Epoch 14 / 300
Iteration 0, loss = 0.0207
Iteration 20, loss = 0.0037
Iteration 40, loss = 0.0260
Iteration 60, loss = 0.0063
Iteration 80, loss = 0.0170
--- Epoch 15 / 300
Iteration 0, loss = 0.0067
Iteration 20, loss = 0.0269
Iteration 40, loss = 0.0091
Iteration 60, loss = 0.0132
Iteration 80, loss = 0.0063
--- Epoch 16 / 300
Iteration 0, loss = 0.0097
Iteration 20, loss = 0.0064
Iteration 40, loss = 0.0121
Iteration 60, loss = 0.0146
Iteration 80, loss = 0.0156
--- Epoch 17 / 300
Iteration 0, loss = 0.0252
Iteration 20, loss = 0.0138
Iteration 40, loss = 0.0109
Iteration 60, loss = 0.0183
Iteration 80, loss = 0.0112
--- Epoch 18 / 300
Iteration 0, loss = 0.0192
Iteration 20, loss = 0.0151
Iteration 40, loss = 0.0184
Iteration 60, loss = 0.0173
Iteration 80, loss = 0.0152
--- Epoch 19 / 300
Iteration 0, loss = 0.0294
Iteration 20, loss = 0.0094
Iteration 40, loss = 0.0150
Iteration 60, loss = 0.0131
Iteration 80, loss = 0.0097
--- Epoch 20 / 300
Iteration 0, loss = 0.0081
Iteration 20, loss = 0.0203
Iteration 40, loss = 0.0156
Iteration 60, loss = 0.0228
Iteration 80, loss = 0.0178
--- Epoch 21 / 300
Iteration 0, loss = 0.0166
Iteration 20, loss = 0.0155
Iteration 40, loss = 0.0133
Iteration 60, loss = 0.0161
Iteration 80, loss = 0.0061
--- Epoch 22 / 300
Iteration 0, loss = 0.0203
Iteration 20, loss = 0.0222
Iteration 40, loss = 0.0139
Iteration 60, loss = 0.0104
Iteration 80, loss = 0.0090
--- Epoch 23 / 300
Iteration 0, loss = 0.0130
Iteration 20, loss = 0.0171
Iteration 40, loss = 0.0087
Iteration 60, loss = 0.0122
Iteration 80, loss = 0.0164
--- Epoch 24 / 300
Iteration 0, loss = 0.0153
Iteration 20, loss = 0.0135
Iteration 40, loss = 0.0081
Iteration 60, loss = 0.0047
Iteration 80, loss = 0.0144
--- Epoch 25 / 300
Iteration 0, loss = 0.0089
Iteration 20, loss = 0.0046
Iteration 40, loss = 0.0402
Iteration 60, loss = 0.0089
Iteration 80, loss = 0.0100
--- Epoch 26 / 300
Iteration 0, loss = 0.0188
Iteration 20, loss = 0.0077
Iteration 40, loss = 0.0170
Iteration 60, loss = 0.0146
Iteration 80, loss = 0.0146
--- Epoch 27 / 300
Iteration 0, loss = 0.0237
Iteration 20, loss = 0.0069
Iteration 40, loss = 0.0168
Iteration 60, loss = 0.0179
Iteration 80, loss = 0.0120
--- Epoch 28 / 300
Iteration 0, loss = 0.0140
Iteration 20, loss = 0.0180
Iteration 40, loss = 0.0049
Iteration 60, loss = 0.0097
Iteration 80, loss = 0.0250
--- Epoch 29 / 300
Iteration 0, loss = 0.0101
Iteration 20, loss = 0.0081
Iteration 40, loss = 0.0066
Iteration 60, loss = 0.0178
Iteration 80, loss = 0.0130
--- Epoch 30 / 300
Iteration 0, loss = 0.0150
Iteration 20, loss = 0.0098
Iteration 40, loss = 0.0117
Iteration 60, loss = 0.0108
Iteration 80, loss = 0.0059
--- Epoch 31 / 300
Iteration 0, loss = 0.0064
Iteration 20, loss = 0.0107
Iteration 40, loss = 0.0090
Iteration 60, loss = 0.0102
Iteration 80, loss = 0.0145
--- Epoch 32 / 300
Iteration 0, loss = 0.0354
Iteration 20, loss = 0.0159
Iteration 40, loss = 0.0086
Iteration 60, loss = 0.0216
Iteration 80, loss = 0.0199
--- Epoch 33 / 300
Iteration 0, loss = 0.0212
Iteration 20, loss = 0.0103
Iteration 40, loss = 0.0142
Iteration 60, loss = 0.0116
Iteration 80, loss = 0.0138
--- Epoch 34 / 300
Iteration 0, loss = 0.0076
Iteration 20, loss = 0.0182
Iteration 40, loss = 0.0167
Iteration 60, loss = 0.0044
Iteration 80, loss = 0.0172
--- Epoch 35 / 300
Iteration 0, loss = 0.0096
Iteration 20, loss = 0.0174
Iteration 40, loss = 0.0054
Iteration 60, loss = 0.0131
Iteration 80, loss = 0.0421
--- Epoch 36 / 300
Iteration 0, loss = 0.0122
Iteration 20, loss = 0.0165
Iteration 40, loss = 0.0104
Iteration 60, loss = 0.0070
Iteration 80, loss = 0.0147
--- Epoch 37 / 300
Iteration 0, loss = 0.0250
Iteration 20, loss = 0.0101
Iteration 40, loss = 0.0691
Iteration 60, loss = 0.0144
Iteration 80, loss = 0.0110
--- Epoch 38 / 300
Iteration 0, loss = 0.0097
Iteration 20, loss = 0.0111
Iteration 40, loss = 0.0209
Iteration 60, loss = 0.0044
Iteration 80, loss = 0.0112
--- Epoch 39 / 300
Iteration 0, loss = 0.0185
Iteration 20, loss = 0.0073
Iteration 40, loss = 0.0167
Iteration 60, loss = 0.0316
Iteration 80, loss = 0.0193
--- Epoch 40 / 300
Iteration 0, loss = 0.0179
Iteration 20, loss = 0.0103
Iteration 40, loss = 0.0059
Iteration 60, loss = 0.0241
Iteration 80, loss = 0.0086
--- Epoch 41 / 300
Iteration 0, loss = 0.0179
Iteration 20, loss = 0.0159
Iteration 40, loss = 0.0095
Iteration 60, loss = 0.0090
Iteration 80, loss = 0.0096
--- Epoch 42 / 300
Iteration 0, loss = 0.0117
Iteration 20, loss = 0.0148
Iteration 40, loss = 0.0167
Iteration 60, loss = 0.0114
Iteration 80, loss = 0.0130
--- Epoch 43 / 300
Iteration 0, loss = 0.0128
Iteration 20, loss = 0.0093
Iteration 40, loss = 0.0216
Iteration 60, loss = 0.0116
Iteration 80, loss = 0.0194
--- Epoch 44 / 300
Iteration 0, loss = 0.0126
Iteration 20, loss = 0.0096
Iteration 40, loss = 0.0126
Iteration 60, loss = 0.0105
Iteration 80, loss = 0.0202
--- Epoch 45 / 300
Iteration 0, loss = 0.0121
Iteration 20, loss = 0.0176
Iteration 40, loss = 0.0203
Iteration 60, loss = 0.0123
Iteration 80, loss = 0.0105
--- Epoch 46 / 300
Iteration 0, loss = 0.0101
Iteration 20, loss = 0.0080
Iteration 40, loss = 0.0104
Iteration 60, loss = 0.0179
Iteration 80, loss = 0.0149
--- Epoch 47 / 300
Iteration 0, loss = 0.0095
Iteration 20, loss = 0.0157
Iteration 40, loss = 0.0254
Iteration 60, loss = 0.0229
Iteration 80, loss = 0.0160
--- Epoch 48 / 300
Iteration 0, loss = 0.0211
Iteration 20, loss = 0.0170
Iteration 40, loss = 0.0092
Iteration 60, loss = 0.0135
Iteration 80, loss = 0.0102
--- Epoch 49 / 300
Iteration 0, loss = 0.0125
Iteration 20, loss = 0.0166
Iteration 40, loss = 0.0180
Iteration 60, loss = 0.0092
Iteration 80, loss = 0.0071
--- Epoch 50 / 300
Iteration 0, loss = 0.0064
Iteration 20, loss = 0.0047
Iteration 40, loss = 0.0128
Iteration 60, loss = 0.0100
Iteration 80, loss = 0.0131
--- Epoch 51 / 300
Iteration 0, loss = 0.0082
Iteration 20, loss = 0.0133
Iteration 40, loss = 0.0093
Iteration 60, loss = 0.0188
Iteration 80, loss = 0.0120
--- Epoch 52 / 300
Iteration 0, loss = 0.0199
Iteration 20, loss = 0.0082
Iteration 40, loss = 0.0079
Iteration 60, loss = 0.0187
Iteration 80, loss = 0.0241
--- Epoch 53 / 300
Iteration 0, loss = 0.0064
Iteration 20, loss = 0.0259
Iteration 40, loss = 0.0297
Iteration 60, loss = 0.0106
Iteration 80, loss = 0.0121
--- Epoch 54 / 300
Iteration 0, loss = 0.0173
Iteration 20, loss = 0.0101
Iteration 40, loss = 0.0150
Iteration 60, loss = 0.0087
Iteration 80, loss = 0.0102
--- Epoch 55 / 300
Iteration 0, loss = 0.0096
Iteration 20, loss = 0.0079
Iteration 40, loss = 0.0097
Iteration 60, loss = 0.0074
Iteration 80, loss = 0.0293
--- Epoch 56 / 300
Iteration 0, loss = 0.0089
Iteration 20, loss = 0.0106
Iteration 40, loss = 0.0055
Iteration 60, loss = 0.0038
Iteration 80, loss = 0.0176
--- Epoch 57 / 300
Iteration 0, loss = 0.0089
Iteration 20, loss = 0.0134
Iteration 40, loss = 0.0059
Iteration 60, loss = 0.0188
Iteration 80, loss = 0.0059
--- Epoch 58 / 300
Iteration 0, loss = 0.0087
Iteration 20, loss = 0.0098
Iteration 40, loss = 0.0035
Iteration 60, loss = 0.0145
Iteration 80, loss = 0.0094
--- Epoch 59 / 300
Iteration 0, loss = 0.0132
Iteration 20, loss = 0.0119
Iteration 40, loss = 0.0094
Iteration 60, loss = 0.0104
Iteration 80, loss = 0.0166
--- Epoch 60 / 300
Iteration 0, loss = 0.0217
Iteration 20, loss = 0.0137
Iteration 40, loss = 0.0147
Iteration 60, loss = 0.0146
Iteration 80, loss = 0.0113
--- Epoch 61 / 300
Iteration 0, loss = 0.0111
Iteration 20, loss = 0.0221
Iteration 40, loss = 0.0214
Iteration 60, loss = 0.0088
Iteration 80, loss = 0.0072
--- Epoch 62 / 300
Iteration 0, loss = 0.0077
Iteration 20, loss = 0.0165
Iteration 40, loss = 0.0071
Iteration 60, loss = 0.0162
Iteration 80, loss = 0.0184
--- Epoch 63 / 300
Iteration 0, loss = 0.0173
Iteration 20, loss = 0.0212
Iteration 40, loss = 0.0087
Iteration 60, loss = 0.0098
Iteration 80, loss = 0.0123
--- Epoch 64 / 300
Iteration 0, loss = 0.0105
Iteration 20, loss = 0.0103
Iteration 40, loss = 0.0157
Iteration 60, loss = 0.0036
Iteration 80, loss = 0.0093
--- Epoch 65 / 300
Iteration 0, loss = 0.0157
Iteration 20, loss = 0.0213
Iteration 40, loss = 0.0199
Iteration 60, loss = 0.0164
Iteration 80, loss = 0.0090
--- Epoch 66 / 300
Iteration 0, loss = 0.0093
Iteration 20, loss = 0.0059
Iteration 40, loss = 0.0212
Iteration 60, loss = 0.0165
Iteration 80, loss = 0.0039
--- Epoch 67 / 300
Iteration 0, loss = 0.0132
Iteration 20, loss = 0.0204
Iteration 40, loss = 0.0079
Iteration 60, loss = 0.0091
Iteration 80, loss = 0.0134
--- Epoch 68 / 300
Iteration 0, loss = 0.0134
Iteration 20, loss = 0.0113
Iteration 40, loss = 0.0212
Iteration 60, loss = 0.0128
Iteration 80, loss = 0.0088
--- Epoch 69 / 300
Iteration 0, loss = 0.0314
Iteration 20, loss = 0.0119
Iteration 40, loss = 0.0128
Iteration 60, loss = 0.0080
Iteration 80, loss = 0.0103
--- Epoch 70 / 300
Iteration 0, loss = 0.0084
Iteration 20, loss = 0.0073
Iteration 40, loss = 0.0125
Iteration 60, loss = 0.0081
Iteration 80, loss = 0.0084
--- Epoch 71 / 300
Iteration 0, loss = 0.0155
Iteration 20, loss = 0.0140
Iteration 40, loss = 0.0131
Iteration 60, loss = 0.0089
Iteration 80, loss = 0.0125
--- Epoch 72 / 300
Iteration 0, loss = 0.0094
Iteration 20, loss = 0.0132
Iteration 40, loss = 0.0223
Iteration 60, loss = 0.0227
Iteration 80, loss = 0.0034
--- Epoch 73 / 300
Iteration 0, loss = 0.0083
Iteration 20, loss = 0.0061
Iteration 40, loss = 0.0134
Iteration 60, loss = 0.0145
Iteration 80, loss = 0.0091
--- Epoch 74 / 300
Iteration 0, loss = 0.0074
Iteration 20, loss = 0.0109
Iteration 40, loss = 0.0140
Iteration 60, loss = 0.0055
Iteration 80, loss = 0.0264
--- Epoch 75 / 300
Iteration 0, loss = 0.0095
Iteration 20, loss = 0.0109
Iteration 40, loss = 0.0069
Iteration 60, loss = 0.0076
Iteration 80, loss = 0.0144
--- Epoch 76 / 300
Iteration 0, loss = 0.0083
Iteration 20, loss = 0.0196
Iteration 40, loss = 0.0223
Iteration 60, loss = 0.0211
Iteration 80, loss = 0.0163
--- Epoch 77 / 300
Iteration 0, loss = 0.0112
Iteration 20, loss = 0.0268
Iteration 40, loss = 0.0084
Iteration 60, loss = 0.0076
Iteration 80, loss = 0.0112
---------------------------------------------------------------------------
KeyboardInterrupt                         Traceback (most recent call last)
<ipython-input-452-13970f5e6e2d> in <module>
----> 1 train(model4, optimizer, epochs=300, criterion=custom_loss)

<ipython-input-5-6d69c0665347> in train(model, optimizer, epochs, criterion)
     34             # Zero out all of the gradients for the variables which the optimizer
     35             # will update.
---> 36             optimizer.zero_grad()
     37 
     38             # This is the backwards pass: compute the gradient of the loss with

KeyboardInterrupt: 
In [453]:
# Inspect model4 with testModel (defined elsewhere in the notebook). The imshow
# warnings in the output mean some plotted values fell outside [0, 1] and were clipped.
testModel(model4)
Clipping input data to the valid range for imshow with RGB data ([0..1] for floats or [0..255] for integers).
Clipping input data to the valid range for imshow with RGB data ([0..1] for floats or [0..255] for integers).
Clipping input data to the valid range for imshow with RGB data ([0..1] for floats or [0..255] for integers).
Clipping input data to the valid range for imshow with RGB data ([0..1] for floats or [0..255] for integers).
In [66]:
# Experiment setup: a second fresh ConvNet with the same SGD settings,
# used for the edge-aware loss run.
learning_rate = 1e-2
model5 = ConvNet()
# Rebinds the notebook-level `optimizer` to model5's parameters.
optimizer = optim.SGD(model5.parameters(), lr=learning_rate)
In [72]:
# Train model5 with custom_loss_edges. The recorded run below was stopped by hand
# (KeyboardInterrupt) after epoch 14 of the requested 300.
train(model5, optimizer, epochs=300, criterion=custom_loss_edges)
--- Epoch 1 / 300
Iteration 0, loss = 0.1264
Iteration 20, loss = 0.0959
Iteration 40, loss = 0.0950
Iteration 60, loss = 0.1142
Iteration 80, loss = 0.1146
--- Epoch 2 / 300
Iteration 0, loss = 0.1114
Iteration 20, loss = 0.0938
Iteration 40, loss = 0.0967
Iteration 60, loss = 0.1293
Iteration 80, loss = 0.1029
--- Epoch 3 / 300
Iteration 0, loss = 0.1161
Iteration 20, loss = 0.1257
Iteration 40, loss = 0.1162
Iteration 60, loss = 0.1176
Iteration 80, loss = 0.0968
--- Epoch 4 / 300
Iteration 0, loss = 0.0887
Iteration 20, loss = 0.1108
Iteration 40, loss = 0.0977
Iteration 60, loss = 0.1076
Iteration 80, loss = 0.0902
--- Epoch 5 / 300
Iteration 0, loss = 0.1177
Iteration 20, loss = 0.0982
Iteration 40, loss = 0.0957
Iteration 60, loss = 0.1109
Iteration 80, loss = 0.1038
--- Epoch 6 / 300
Iteration 0, loss = 0.0996
Iteration 20, loss = 0.0890
Iteration 40, loss = 0.1083
Iteration 60, loss = 0.1139
Iteration 80, loss = 0.1148
--- Epoch 7 / 300
Iteration 0, loss = 0.1036
Iteration 20, loss = 0.1009
Iteration 40, loss = 0.0886
Iteration 60, loss = 0.0989
Iteration 80, loss = 0.1176
--- Epoch 8 / 300
Iteration 0, loss = 0.0981
Iteration 20, loss = 0.1265
Iteration 40, loss = 0.1045
Iteration 60, loss = 0.1128
Iteration 80, loss = 0.0987
--- Epoch 9 / 300
Iteration 0, loss = 0.0919
Iteration 20, loss = 0.1085
Iteration 40, loss = 0.1061
Iteration 60, loss = 0.1128
Iteration 80, loss = 0.1039
--- Epoch 10 / 300
Iteration 0, loss = 0.1030
Iteration 20, loss = 0.0932
Iteration 40, loss = 0.1131
Iteration 60, loss = 0.1318
Iteration 80, loss = 0.1277
--- Epoch 11 / 300
Iteration 0, loss = 0.1366
Iteration 20, loss = 0.1155
Iteration 40, loss = 0.1211
Iteration 60, loss = 0.0946
Iteration 80, loss = 0.1204
--- Epoch 12 / 300
Iteration 0, loss = 0.1139
Iteration 20, loss = 0.0945
Iteration 40, loss = 0.0955
Iteration 60, loss = 0.1091
Iteration 80, loss = 0.0902
--- Epoch 13 / 300
Iteration 0, loss = 0.1126
Iteration 20, loss = 0.0948
Iteration 40, loss = 0.0972
Iteration 60, loss = 0.0968
Iteration 80, loss = 0.1454
--- Epoch 14 / 300
Iteration 0, loss = 0.1354
Iteration 20, loss = 0.1142
Iteration 40, loss = 0.0934
Iteration 60, loss = 0.1096
Iteration 80, loss = 0.0959
---------------------------------------------------------------------------
KeyboardInterrupt                         Traceback (most recent call last)
<ipython-input-72-157c50dede99> in <module>
----> 1 train(model5, optimizer, epochs=300, criterion=custom_loss_edges)

<ipython-input-6-6d69c0665347> in train(model, optimizer, epochs, criterion)
     34             # Zero out all of the gradients for the variables which the optimizer
     35             # will update.
---> 36             optimizer.zero_grad()
     37 
     38             # This is the backwards pass: compute the gradient of the loss with

/opt/anaconda3/envs/cs682/lib/python3.6/site-packages/torch/optim/optimizer.py in zero_grad(self)
    170                 if p.grad is not None:
    171                     p.grad.detach_()
--> 172                     p.grad.zero_()
    173 
    174     def step(self, closure):

KeyboardInterrupt: 
In [73]:
# Inspect model5 with testModel (defined elsewhere in the notebook). The imshow
# warnings in the output mean some plotted values fell outside [0, 1] and were clipped.
testModel(model5)
Clipping input data to the valid range for imshow with RGB data ([0..1] for floats or [0..255] for integers).
Clipping input data to the valid range for imshow with RGB data ([0..1] for floats or [0..255] for integers).
Clipping input data to the valid range for imshow with RGB data ([0..1] for floats or [0..255] for integers).
Clipping input data to the valid range for imshow with RGB data ([0..1] for floats or [0..255] for integers).
Clipping input data to the valid range for imshow with RGB data ([0..1] for floats or [0..255] for integers).
Clipping input data to the valid range for imshow with RGB data ([0..1] for floats or [0..255] for integers).
Clipping input data to the valid range for imshow with RGB data ([0..1] for floats or [0..255] for integers).
Clipping input data to the valid range for imshow with RGB data ([0..1] for floats or [0..255] for integers).
Clipping input data to the valid range for imshow with RGB data ([0..1] for floats or [0..255] for integers).
In [189]:
class ConvNet2(nn.Module):
    """Four conv + batch-norm stages and one linear layer, for a single 3x32x32 image.

    The flattened convolutional features are concatenated with the flattened
    input itself before the linear layer, which emits 32 * 32 * 3 values.
    """

    def __init__(self):
        super().__init__()
        # Starts at 0; presumably advanced by the training loop (not visible here).
        self.epochsTrained = 0

        # One batch-norm layer per convolution, sized to that convolution's output channels.
        self.batchnorm1 = nn.BatchNorm2d(num_features=24)
        self.batchnorm2 = nn.BatchNorm2d(num_features=24)
        self.batchnorm3 = nn.BatchNorm2d(num_features=12)
        self.batchnorm4 = nn.BatchNorm2d(num_features=12)

        # Spatial size per stage for a 32x32 input: 32 -> 31 -> 30 -> 29 -> 29.
        self.conv1 = nn.Conv2d(in_channels=3, out_channels=24, kernel_size=6, stride=1, padding=2)  # 24 6x6 filters
        self.conv2 = nn.Conv2d(in_channels=24, out_channels=24, kernel_size=4, stride=1, padding=1)  # 24 4x4 filters
        self.conv3 = nn.Conv2d(in_channels=24, out_channels=12, kernel_size=4, stride=1, padding=1)  # 12 4x4 filters
        self.conv4 = nn.Conv2d(in_channels=12, out_channels=12, kernel_size=3, stride=1, padding=1)  # 12 3x3 filters

        # 12 * 29 * 29 conv features + 3 * 32 * 32 raw input values = 13164 inputs.
        self.fc = nn.Linear(12 * 29 * 29 + 3 * 32 * 32, 32 * 32 * 3)

    def forward(self, x):
        """Map one (3, 32, 32) image tensor to a flat vector of 32 * 32 * 3 values."""
        # The conv layers need a batch axis; the network handles one image at a time.
        batched = x.unsqueeze(0)

        features = self.batchnorm1(F.relu(self.conv1(batched)))
        features = self.batchnorm2(F.relu(self.conv2(features)))
        features = self.batchnorm3(F.relu(self.conv3(features)))
        features = self.batchnorm4(torch.tanh(self.conv4(features)))

        # Give the linear layer direct access to the input alongside the conv features.
        flat_features = features.view(-1)
        flat_input = x.view(-1)
        return self.fc(torch.cat((flat_features, flat_input), 0))
In [125]:
# Experiment setup: the ConvNet2 architecture with the same SGD settings as before.
learning_rate = 1e-2
model6 = ConvNet2()
# Rebinds the notebook-level `optimizer` to model6's parameters.
optimizer = optim.SGD(model6.parameters(), lr=learning_rate)
In [128]:
# Train model6 with custom_loss. The recorded run below was stopped by hand
# (KeyboardInterrupt) during epoch 12 of the requested 250.
train(model6, optimizer, epochs=250, criterion=custom_loss)
--- Epoch 1 / 250
Iteration 0, loss = 0.1323
Iteration 20, loss = 0.1473
Iteration 40, loss = 0.1414
Iteration 60, loss = 0.1272
Iteration 80, loss = 0.1903
--- Epoch 2 / 250
Iteration 0, loss = 0.0930
Iteration 20, loss = 0.0972
Iteration 40, loss = 0.1379
Iteration 60, loss = 0.0825
Iteration 80, loss = 0.1351
--- Epoch 3 / 250
Iteration 0, loss = 0.1339
Iteration 20, loss = 0.1859
Iteration 40, loss = 0.1257
Iteration 60, loss = 0.1184
Iteration 80, loss = 0.0991
--- Epoch 4 / 250
Iteration 0, loss = 0.1137
Iteration 20, loss = 0.0941
Iteration 40, loss = 0.1762
Iteration 60, loss = 0.1596
Iteration 80, loss = 0.1572
--- Epoch 5 / 250
Iteration 0, loss = 0.1331
Iteration 20, loss = 0.1142
Iteration 40, loss = 0.1244
Iteration 60, loss = 0.1387
Iteration 80, loss = 0.1038
--- Epoch 6 / 250
Iteration 0, loss = 0.0847
Iteration 20, loss = 0.1252
Iteration 40, loss = 0.1097
Iteration 60, loss = 0.1029
Iteration 80, loss = 0.1377
--- Epoch 7 / 250
Iteration 0, loss = 0.1077
Iteration 20, loss = 0.1487
Iteration 40, loss = 0.0997
Iteration 60, loss = 0.1337
Iteration 80, loss = 0.1576
--- Epoch 8 / 250
Iteration 0, loss = 0.1305
Iteration 20, loss = 0.1682
Iteration 40, loss = 0.1038
Iteration 60, loss = 0.1402
Iteration 80, loss = 0.1207
--- Epoch 9 / 250
Iteration 0, loss = 0.0850
Iteration 20, loss = 0.1723
Iteration 40, loss = 0.1478
Iteration 60, loss = 0.1355
Iteration 80, loss = 0.0900
--- Epoch 10 / 250
Iteration 0, loss = 0.0949
Iteration 20, loss = 0.1598
Iteration 40, loss = 0.1249
Iteration 60, loss = 0.0941
Iteration 80, loss = 0.1503
--- Epoch 11 / 250
Iteration 0, loss = 0.0915
Iteration 20, loss = 0.1141
Iteration 40, loss = 0.1179
Iteration 60, loss = 0.0786
Iteration 80, loss = 0.1332
--- Epoch 12 / 250
Iteration 0, loss = 0.1909
Iteration 20, loss = 0.1306
---------------------------------------------------------------------------
KeyboardInterrupt                         Traceback (most recent call last)
<ipython-input-128-1446adb45ff8> in <module>
----> 1 train(model6, optimizer, epochs=250, criterion=custom_loss)

<ipython-input-6-6d69c0665347> in train(model, optimizer, epochs, criterion)
     38             # This is the backwards pass: compute the gradient of the loss with
     39             # respect to each  parameter of the model.
---> 40             loss.backward()
     41 
     42             # Actually update the parameters of the model using the gradients

/opt/anaconda3/envs/cs682/lib/python3.6/site-packages/torch/tensor.py in backward(self, gradient, retain_graph, create_graph)
    183                 products. Defaults to ``False``.
    184         """
--> 185         torch.autograd.backward(self, gradient, retain_graph, create_graph)
    186 
    187     def register_hook(self, hook):

/opt/anaconda3/envs/cs682/lib/python3.6/site-packages/torch/autograd/__init__.py in backward(tensors, grad_tensors, retain_graph, create_graph, grad_variables)
    125     Variable._execution_engine.run_backward(
    126         tensors, grad_tensors, retain_graph, create_graph,
--> 127         allow_unreachable=True)  # allow_unreachable flag
    128 
    129 

KeyboardInterrupt: 
In [129]:
# Inspect the model trained in the preceding cell. This call previously passed
# model5, so the freshly trained ConvNet2 (model6) was never visualised.
testModel(model6)
Clipping input data to the valid range for imshow with RGB data ([0..1] for floats or [0..255] for integers).
Clipping input data to the valid range for imshow with RGB data ([0..1] for floats or [0..255] for integers).
Clipping input data to the valid range for imshow with RGB data ([0..1] for floats or [0..255] for integers).
Clipping input data to the valid range for imshow with RGB data ([0..1] for floats or [0..255] for integers).
Clipping input data to the valid range for imshow with RGB data ([0..1] for floats or [0..255] for integers).
Clipping input data to the valid range for imshow with RGB data ([0..1] for floats or [0..255] for integers).
Clipping input data to the valid range for imshow with RGB data ([0..1] for floats or [0..255] for integers).
Clipping input data to the valid range for imshow with RGB data ([0..1] for floats or [0..255] for integers).
Clipping input data to the valid range for imshow with RGB data ([0..1] for floats or [0..255] for integers).

Try training on a single class to make the task easier for the network

In [6]:
# CIFAR-10 label names, listed so that position == integer label
classes = ["airplane", "automobile", "bird", "cat", "deer", "dog", "frog", "horse", "ship", "truck"]

# For every class, store its colour images under "y_<split>_<class>" and the
# matching grayscale versions under "X_<split>_<class>".
for c, cname in enumerate(classes):
    # Positions of this class's samples in each split
    train_idx = np.where(unproccessed_data["y_train"] == c)
    test_idx = np.where(unproccessed_data["y_test"] == c)
    val_idx = np.where(unproccessed_data["y_val"] == c)

    # Select each colour subset once and reuse it for both targets and inputs
    train_color = unproccessed_data["X_train"][train_idx]
    val_color = unproccessed_data["X_val"][val_idx]
    test_color = unproccessed_data["X_test"][test_idx]

    # Targets: the original colour images
    data["y_train_" + cname] = train_color
    data["y_val_" + cname] = val_color
    data["y_test_" + cname] = test_color

    # Inputs: the same images converted to grayscale
    data["X_train_" + cname] = convertToBW(train_color)
    data["X_val_" + cname] = convertToBW(val_color)
    data["X_test_" + cname] = convertToBW(test_color)
dict_keys(['y_train', 'y_val', 'y_test', 'X_train', 'X_val', 'X_test', 'y_train_airplane', 'y_val_airplane', 'y_test_airplane', 'X_train_airplane', 'X_val_airplane', 'X_test_airplane', 'y_train_automobile', 'y_val_automobile', 'y_test_automobile', 'X_train_automobile', 'X_val_automobile', 'X_test_automobile', 'y_train_bird', 'y_val_bird', 'y_test_bird', 'X_train_bird', 'X_val_bird', 'X_test_bird', 'y_train_cat', 'y_val_cat', 'y_test_cat', 'X_train_cat', 'X_val_cat', 'X_test_cat', 'y_train_deer', 'y_val_deer', 'y_test_deer', 'X_train_deer', 'X_val_deer', 'X_test_deer', 'y_train_dog', 'y_val_dog', 'y_test_dog', 'X_train_dog', 'X_val_dog', 'X_test_dog', 'y_train_frog', 'y_val_frog', 'y_test_frog', 'X_train_frog', 'X_val_frog', 'X_test_frog', 'y_train_horse', 'y_val_horse', 'y_test_horse', 'X_train_horse', 'X_val_horse', 'X_test_horse', 'y_train_ship', 'y_val_ship', 'y_test_ship', 'X_train_ship', 'X_val_ship', 'X_test_ship', 'y_train_truck', 'y_val_truck', 'y_test_truck', 'X_train_truck', 'X_val_truck', 'X_test_truck'])
In [214]:
# Experiment setup for the single-class run: ConvNet2 with a smaller learning
# rate (5e-3) than the 1e-2 used for the earlier models.
learning_rate = 5e-3
model7 = ConvNet2()
# Rebinds the notebook-level `optimizer` to model7's parameters.
optimizer = optim.SGD(model7.parameters(), lr=learning_rate)
In [215]:
# Train model7 on a per-class subset with custom_loss.
# NOTE(review): "X_train_class" / "y_train_class" are not among the keys built by the
# per-class split cell above, which stores names such as "X_train_airplane". Presumably
# these keys came from an earlier version of that cell -- confirm which class was
# intended, otherwise this lookup raises KeyError on a fresh kernel.
train(model7, optimizer, epochs=1000, x_train=data["X_train_class"],  y_train=data["y_train_class"], criterion=custom_loss)
--- Epoch 1 / 1000
Iteration 0, loss = 0.5163
Iteration 20, loss = 0.4907
Iteration 40, loss = 0.3813
Iteration 60, loss = 0.2225
Iteration 80, loss = 0.2141
--- Epoch 2 / 1000
Iteration 0, loss = 0.1437
Iteration 20, loss = 0.1209
Iteration 40, loss = 0.1181
Iteration 60, loss = 0.1140
Iteration 80, loss = 0.1295
--- Epoch 3 / 1000
Iteration 0, loss = 0.1044
Iteration 20, loss = 0.0945
Iteration 40, loss = 0.0883
Iteration 60, loss = 0.0771
Iteration 80, loss = 0.1358
--- Epoch 4 / 1000
Iteration 0, loss = 0.0540
Iteration 20, loss = 0.0467
Iteration 40, loss = 0.0336
Iteration 60, loss = 0.0385
Iteration 80, loss = 0.0180
--- Epoch 5 / 1000
Iteration 0, loss = 0.0517
Iteration 20, loss = 0.0614
Iteration 40, loss = 0.0143
Iteration 60, loss = 0.0386
Iteration 80, loss = 0.2632
--- Epoch 6 / 1000
Iteration 0, loss = 0.0245
Iteration 20, loss = 0.0095
Iteration 40, loss = 0.1029
Iteration 60, loss = 0.0547
Iteration 80, loss = 0.0560
--- Epoch 7 / 1000
Iteration 0, loss = 0.0149
Iteration 20, loss = 0.0323
Iteration 40, loss = 0.0297
Iteration 60, loss = 0.0215
Iteration 80, loss = 0.0278
--- Epoch 8 / 1000
Iteration 0, loss = 0.0288
Iteration 20, loss = 0.0433
Iteration 40, loss = 0.0269
Iteration 60, loss = 0.0411
Iteration 80, loss = 0.0266
--- Epoch 9 / 1000
Iteration 0, loss = 0.0520
Iteration 20, loss = 0.0614
Iteration 40, loss = 0.0220
Iteration 60, loss = 0.0699
Iteration 80, loss = 0.0410
--- Epoch 10 / 1000
Iteration 0, loss = 0.0454
Iteration 20, loss = 0.2740
Iteration 40, loss = 0.0621
Iteration 60, loss = 0.0261
Iteration 80, loss = 0.0162
--- Epoch 11 / 1000
Iteration 0, loss = 0.0524
Iteration 20, loss = 0.1356
Iteration 40, loss = 0.0476
Iteration 60, loss = 0.0168
Iteration 80, loss = 0.0620
--- Epoch 12 / 1000
Iteration 0, loss = 0.0308
Iteration 20, loss = 0.0029
Iteration 40, loss = 0.0632
Iteration 60, loss = 0.0402
Iteration 80, loss = 0.0662
--- Epoch 13 / 1000
Iteration 0, loss = 0.0092
Iteration 20, loss = 0.1502
Iteration 40, loss = 0.0053
Iteration 60, loss = 0.0163
Iteration 80, loss = 0.0521
--- Epoch 14 / 1000
Iteration 0, loss = 0.0121
Iteration 20, loss = 0.0221
Iteration 40, loss = 0.0472
Iteration 60, loss = 0.0219
Iteration 80, loss = 0.0227
--- Epoch 15 / 1000
Iteration 0, loss = 0.0262
Iteration 20, loss = 0.0331
Iteration 40, loss = 0.0581
Iteration 60, loss = 0.0273
Iteration 80, loss = 0.0097
--- Epoch 16 / 1000
Iteration 0, loss = 0.0416
Iteration 20, loss = 0.0209
Iteration 40, loss = 0.0172
Iteration 60, loss = 0.0391
Iteration 80, loss = 0.0136
--- Epoch 17 / 1000
Iteration 0, loss = 0.0163
Iteration 20, loss = 0.0383
Iteration 40, loss = 0.0239
Iteration 60, loss = 0.0339
Iteration 80, loss = 0.0503
--- Epoch 18 / 1000
Iteration 0, loss = 0.0419
Iteration 20, loss = 0.0180
Iteration 40, loss = 0.0152
Iteration 60, loss = 0.0313
Iteration 80, loss = 0.0396
--- Epoch 19 / 1000
Iteration 0, loss = 0.0203
Iteration 20, loss = 0.0398
Iteration 40, loss = 0.0220
Iteration 60, loss = 0.1211
Iteration 80, loss = 0.0583
--- Epoch 20 / 1000
Iteration 0, loss = 0.0395
Iteration 20, loss = 0.0629
Iteration 40, loss = 0.0217
Iteration 60, loss = 0.0135
Iteration 80, loss = 0.0304
--- Epoch 21 / 1000
Iteration 0, loss = 0.0188
Iteration 20, loss = 0.0313
Iteration 40, loss = 0.0239
Iteration 60, loss = 0.0747
Iteration 80, loss = 0.0119
--- Epoch 22 / 1000
Iteration 0, loss = 0.0401
Iteration 20, loss = 0.0099
Iteration 40, loss = 0.0104
Iteration 60, loss = 0.0033
Iteration 80, loss = 0.0185
--- Epoch 23 / 1000
Iteration 0, loss = 0.0225
Iteration 20, loss = 0.0245
Iteration 40, loss = 0.0240
Iteration 60, loss = 0.0128
Iteration 80, loss = 0.0425
--- Epoch 24 / 1000
Iteration 0, loss = 0.0215
Iteration 20, loss = 0.0117
Iteration 40, loss = 0.0301
Iteration 60, loss = 0.0595
Iteration 80, loss = 0.0138
--- Epoch 25 / 1000
Iteration 0, loss = 0.0402
Iteration 20, loss = 0.0143
Iteration 40, loss = 0.0263
Iteration 60, loss = 0.0313
Iteration 80, loss = 0.0091
--- Epoch 26 / 1000
Iteration 0, loss = 0.0198
Iteration 20, loss = 0.0093
Iteration 40, loss = 0.0317
Iteration 60, loss = 0.0206
Iteration 80, loss = 0.0406
--- Epoch 27 / 1000
Iteration 0, loss = 0.0377
Iteration 20, loss = 0.0367
Iteration 40, loss = 0.0697
Iteration 60, loss = 0.0375
Iteration 80, loss = 0.0241
--- Epoch 28 / 1000
Iteration 0, loss = 0.0295
Iteration 20, loss = 0.0183
Iteration 40, loss = 0.0169
Iteration 60, loss = 0.0361
Iteration 80, loss = 0.0107
--- Epoch 29 / 1000
Iteration 0, loss = 0.0550
Iteration 20, loss = 0.0414
Iteration 40, loss = 0.0296
Iteration 60, loss = 0.0179
Iteration 80, loss = 0.0166
--- Epoch 30 / 1000
Iteration 0, loss = 0.0230
Iteration 20, loss = 0.0165
Iteration 40, loss = 0.0400
Iteration 60, loss = 0.0717
Iteration 80, loss = 0.0482
--- Epoch 31 / 1000
Iteration 0, loss = 0.0391
Iteration 20, loss = 0.0224
Iteration 40, loss = 0.0149
Iteration 60, loss = 0.0201
Iteration 80, loss = 0.0165
--- Epoch 32 / 1000
Iteration 0, loss = 0.0379
Iteration 20, loss = 0.0352
Iteration 40, loss = 0.0183
Iteration 60, loss = 0.0624
Iteration 80, loss = 0.0251
--- Epoch 33 / 1000
Iteration 0, loss = 0.0240
Iteration 20, loss = 0.0300
Iteration 40, loss = 0.0416
Iteration 60, loss = 0.0236
Iteration 80, loss = 0.0365
--- Epoch 34 / 1000
Iteration 0, loss = 0.0231
Iteration 20, loss = 0.0346
Iteration 40, loss = 0.0091
Iteration 60, loss = 0.0113
Iteration 80, loss = 0.0182
--- Epoch 35 / 1000
Iteration 0, loss = 0.0196
Iteration 20, loss = 0.0101
Iteration 40, loss = 0.0253
Iteration 60, loss = 0.0188
Iteration 80, loss = 0.0393
--- Epoch 36 / 1000
Iteration 0, loss = 0.0299
Iteration 20, loss = 0.0293
Iteration 40, loss = 0.0411
Iteration 60, loss = 0.0381
Iteration 80, loss = 0.0346
--- Epoch 37 / 1000
Iteration 0, loss = 0.0211
Iteration 20, loss = 0.0241
Iteration 40, loss = 0.0253
Iteration 60, loss = 0.0092
Iteration 80, loss = 0.0234
--- Epoch 38 / 1000
Iteration 0, loss = 0.0458
Iteration 20, loss = 0.0430
Iteration 40, loss = 0.0123
Iteration 60, loss = 0.0342
Iteration 80, loss = 0.0122
--- Epoch 39 / 1000
Iteration 0, loss = 0.0069
Iteration 20, loss = 0.0430
Iteration 40, loss = 0.0305
Iteration 60, loss = 0.0245
Iteration 80, loss = 0.0105
--- Epoch 40 / 1000
Iteration 0, loss = 0.0285
Iteration 20, loss = 0.0288
Iteration 40, loss = 0.0351
Iteration 60, loss = 0.0193
Iteration 80, loss = 0.0182
--- Epoch 41 / 1000
Iteration 0, loss = 0.0215
Iteration 20, loss = 0.0124
Iteration 40, loss = 0.0369
Iteration 60, loss = 0.0319
Iteration 80, loss = 0.0225
--- Epoch 42 / 1000
Iteration 0, loss = 0.0176
Iteration 20, loss = 0.0278
Iteration 40, loss = 0.0158
Iteration 60, loss = 0.0450
Iteration 80, loss = 0.0220
--- Epoch 43 / 1000
Iteration 0, loss = 0.0210
Iteration 20, loss = 0.0141
Iteration 40, loss = 0.0275
Iteration 60, loss = 0.0138
Iteration 80, loss = 0.0320
--- Epoch 44 / 1000
Iteration 0, loss = 0.0664
Iteration 20, loss = 0.0175
Iteration 40, loss = 0.0199
Iteration 60, loss = 0.0085
Iteration 80, loss = 0.0283
--- Epoch 45 / 1000
Iteration 0, loss = 0.0232
Iteration 20, loss = 0.0084
Iteration 40, loss = 0.0316
Iteration 60, loss = 0.0146
Iteration 80, loss = 0.0123
--- Epoch 46 / 1000
Iteration 0, loss = 0.0200
Iteration 20, loss = 0.0132
Iteration 40, loss = 0.0210
Iteration 60, loss = 0.0339
Iteration 80, loss = 0.0177
--- Epoch 47 / 1000
Iteration 0, loss = 0.0280
Iteration 20, loss = 0.0240
Iteration 40, loss = 0.0388
Iteration 60, loss = 0.0185
Iteration 80, loss = 0.0533
--- Epoch 48 / 1000
Iteration 0, loss = 0.0459
Iteration 20, loss = 0.0182
Iteration 40, loss = 0.0097
Iteration 60, loss = 0.0639
Iteration 80, loss = 0.0358
--- Epoch 49 / 1000
Iteration 0, loss = 0.0227
Iteration 20, loss = 0.0481
Iteration 40, loss = 0.0399
Iteration 60, loss = 0.0158
Iteration 80, loss = 0.0396
--- Epoch 50 / 1000
Iteration 0, loss = 0.0191
Iteration 20, loss = 0.0142
Iteration 40, loss = 0.0265
Iteration 60, loss = 0.0308
Iteration 80, loss = 0.0324
--- Epoch 51 / 1000
Iteration 0, loss = 0.0276
Iteration 20, loss = 0.0343
Iteration 40, loss = 0.0155
Iteration 60, loss = 0.0221
Iteration 80, loss = 0.0337
--- Epoch 52 / 1000
Iteration 0, loss = 0.0360
Iteration 20, loss = 0.0185
Iteration 40, loss = 0.0221
Iteration 60, loss = 0.0072
Iteration 80, loss = 0.0352
--- Epoch 53 / 1000
Iteration 0, loss = 0.0365
Iteration 20, loss = 0.0185
Iteration 40, loss = 0.0211
Iteration 60, loss = 0.0462
Iteration 80, loss = 0.0185
--- Epoch 54 / 1000
Iteration 0, loss = 0.0172
Iteration 20, loss = 0.0149
Iteration 40, loss = 0.0452
Iteration 60, loss = 0.0118
Iteration 80, loss = 0.0195
--- Epoch 55 / 1000
Iteration 0, loss = 0.0202
Iteration 20, loss = 0.0232
Iteration 40, loss = 0.0166
Iteration 60, loss = 0.0251
Iteration 80, loss = 0.0262
--- Epoch 56 / 1000
Iteration 0, loss = 0.0095
Iteration 20, loss = 0.0177
Iteration 40, loss = 0.0215
Iteration 60, loss = 0.0106
Iteration 80, loss = 0.0312
--- Epoch 57 / 1000
Iteration 0, loss = 0.0200
Iteration 20, loss = 0.0347
Iteration 40, loss = 0.0095
Iteration 60, loss = 0.0166
Iteration 80, loss = 0.0248
--- Epoch 58 / 1000
Iteration 0, loss = 0.0280
Iteration 20, loss = 0.0231
Iteration 40, loss = 0.0176
Iteration 60, loss = 0.0302
Iteration 80, loss = 0.0135
--- Epoch 59 / 1000
Iteration 0, loss = 0.0239
Iteration 20, loss = 0.0068
Iteration 40, loss = 0.0205
Iteration 60, loss = 0.0321
Iteration 80, loss = 0.0263
--- Epoch 60 / 1000
Iteration 0, loss = 0.0213
Iteration 20, loss = 0.0143
Iteration 40, loss = 0.0420
Iteration 60, loss = 0.0288
Iteration 80, loss = 0.0458
--- Epoch 61 / 1000
Iteration 0, loss = 0.0098
Iteration 20, loss = 0.0124
Iteration 40, loss = 0.0140
Iteration 60, loss = 0.0264
Iteration 80, loss = 0.0568
--- Epoch 62 / 1000
Iteration 0, loss = 0.0481
Iteration 20, loss = 0.0230
Iteration 40, loss = 0.0111
Iteration 60, loss = 0.0136
Iteration 80, loss = 0.0302
--- Epoch 63 / 1000
Iteration 0, loss = 0.0271
Iteration 20, loss = 0.0217
Iteration 40, loss = 0.0120
Iteration 60, loss = 0.0104
Iteration 80, loss = 0.0278
--- Epoch 64 / 1000
Iteration 0, loss = 0.0078
Iteration 20, loss = 0.0439
Iteration 40, loss = 0.0184
Iteration 60, loss = 0.0288
Iteration 80, loss = 0.0240
--- Epoch 65 / 1000
Iteration 0, loss = 0.0308
Iteration 20, loss = 0.0133
Iteration 40, loss = 0.0164
Iteration 60, loss = 0.0172
Iteration 80, loss = 0.0070
--- Epoch 66 / 1000
Iteration 0, loss = 0.0419
Iteration 20, loss = 0.0496
Iteration 40, loss = 0.0151
Iteration 60, loss = 0.0143
Iteration 80, loss = 0.0146
--- Epoch 67 / 1000
Iteration 0, loss = 0.0520
Iteration 20, loss = 0.0169
Iteration 40, loss = 0.0399
Iteration 60, loss = 0.0223
Iteration 80, loss = 0.0188
--- Epoch 68 / 1000
Iteration 0, loss = 0.0240
Iteration 20, loss = 0.0135
Iteration 40, loss = 0.0268
Iteration 60, loss = 0.0094
Iteration 80, loss = 0.0098
--- Epoch 69 / 1000
Iteration 0, loss = 0.0826
Iteration 20, loss = 0.0194
Iteration 40, loss = 0.0347
Iteration 60, loss = 0.0122
Iteration 80, loss = 0.0188
--- Epoch 70 / 1000
Iteration 0, loss = 0.0217
Iteration 20, loss = 0.0117
Iteration 40, loss = 0.0173
Iteration 60, loss = 0.0216
Iteration 80, loss = 0.0166
--- Epoch 71 / 1000
Iteration 0, loss = 0.0323
Iteration 20, loss = 0.0216
Iteration 40, loss = 0.0229
Iteration 60, loss = 0.0577
Iteration 80, loss = 0.0388
--- Epoch 72 / 1000
Iteration 0, loss = 0.0289
Iteration 20, loss = 0.0093
Iteration 40, loss = 0.0189
Iteration 60, loss = 0.0230
Iteration 80, loss = 0.0085
--- Epoch 73 / 1000
Iteration 0, loss = 0.0295
Iteration 20, loss = 0.0095
Iteration 40, loss = 0.0258
Iteration 60, loss = 0.0294
Iteration 80, loss = 0.0128
--- Epoch 74 / 1000
Iteration 0, loss = 0.0415
Iteration 20, loss = 0.0526
Iteration 40, loss = 0.0114
Iteration 60, loss = 0.0283
Iteration 80, loss = 0.0200
--- Epoch 75 / 1000
Iteration 0, loss = 0.0234
Iteration 20, loss = 0.0146
Iteration 40, loss = 0.0276
Iteration 60, loss = 0.0147
Iteration 80, loss = 0.0158
--- Epoch 76 / 1000
Iteration 0, loss = 0.0402
Iteration 20, loss = 0.0414
Iteration 40, loss = 0.0146
Iteration 60, loss = 0.0085
Iteration 80, loss = 0.0116
--- Epoch 77 / 1000
Iteration 0, loss = 0.0143
Iteration 20, loss = 0.0352
Iteration 40, loss = 0.0217
Iteration 60, loss = 0.0284
Iteration 80, loss = 0.0333
--- Epoch 78 / 1000
Iteration 0, loss = 0.0128
Iteration 20, loss = 0.0296
Iteration 40, loss = 0.0223
Iteration 60, loss = 0.0283
Iteration 80, loss = 0.0173
--- Epoch 79 / 1000
Iteration 0, loss = 0.0083
Iteration 20, loss = 0.0282
Iteration 40, loss = 0.0213
Iteration 60, loss = 0.0223
Iteration 80, loss = 0.0111
--- Epoch 80 / 1000
Iteration 0, loss = 0.0166
Iteration 20, loss = 0.0182
Iteration 40, loss = 0.0265
Iteration 60, loss = 0.0206
Iteration 80, loss = 0.0160
--- Epoch 81 / 1000
Iteration 0, loss = 0.0097
Iteration 20, loss = 0.0244
Iteration 40, loss = 0.0366
Iteration 60, loss = 0.0275
Iteration 80, loss = 0.0168
--- Epoch 82 / 1000
Iteration 0, loss = 0.0146
Iteration 20, loss = 0.0141
Iteration 40, loss = 0.0137
Iteration 60, loss = 0.0203
Iteration 80, loss = 0.0145
--- Epoch 83 / 1000
Iteration 0, loss = 0.0151
Iteration 20, loss = 0.0154
Iteration 40, loss = 0.0114
Iteration 60, loss = 0.0173
Iteration 80, loss = 0.0102
--- Epoch 84 / 1000
Iteration 0, loss = 0.0300
Iteration 20, loss = 0.0242
Iteration 40, loss = 0.0274
Iteration 60, loss = 0.0142
Iteration 80, loss = 0.0153
--- Epoch 85 / 1000
Iteration 0, loss = 0.0066
Iteration 20, loss = 0.0521
Iteration 40, loss = 0.0184
Iteration 60, loss = 0.0164
Iteration 80, loss = 0.0279
--- Epoch 86 / 1000
Iteration 0, loss = 0.0166
Iteration 20, loss = 0.0107
Iteration 40, loss = 0.0359
Iteration 60, loss = 0.0395
Iteration 80, loss = 0.0092
--- Epoch 87 / 1000
Iteration 0, loss = 0.0094
Iteration 20, loss = 0.0201
Iteration 40, loss = 0.0143
Iteration 60, loss = 0.0270
Iteration 80, loss = 0.0391
--- Epoch 88 / 1000
Iteration 0, loss = 0.0467
Iteration 20, loss = 0.0372
Iteration 40, loss = 0.0065
Iteration 60, loss = 0.0252
Iteration 80, loss = 0.0214
--- Epoch 89 / 1000
Iteration 0, loss = 0.0072
Iteration 20, loss = 0.0370
Iteration 40, loss = 0.0712
Iteration 60, loss = 0.0447
Iteration 80, loss = 0.0260
--- Epoch 90 / 1000
Iteration 0, loss = 0.0134
Iteration 20, loss = 0.0293
Iteration 40, loss = 0.0201
Iteration 60, loss = 0.0237
Iteration 80, loss = 0.0448
--- Epoch 91 / 1000
Iteration 0, loss = 0.0088
Iteration 20, loss = 0.0155
Iteration 40, loss = 0.0160
Iteration 60, loss = 0.0285
Iteration 80, loss = 0.0148
--- Epoch 92 / 1000
Iteration 0, loss = 0.0118
Iteration 20, loss = 0.0239
Iteration 40, loss = 0.0360
Iteration 60, loss = 0.0147
Iteration 80, loss = 0.0181
--- Epoch 93 / 1000
Iteration 0, loss = 0.0542
Iteration 20, loss = 0.0222
Iteration 40, loss = 0.0165
Iteration 60, loss = 0.0068
Iteration 80, loss = 0.0276
--- Epoch 94 / 1000
Iteration 0, loss = 0.0227
Iteration 20, loss = 0.0256
Iteration 40, loss = 0.0363
Iteration 60, loss = 0.0137
Iteration 80, loss = 0.0120
--- Epoch 95 / 1000
Iteration 0, loss = 0.0118
Iteration 20, loss = 0.0208
Iteration 40, loss = 0.0690
Iteration 60, loss = 0.0734
Iteration 80, loss = 0.0271
--- Epoch 96 / 1000
Iteration 0, loss = 0.0065
Iteration 20, loss = 0.0413
Iteration 40, loss = 0.0204
Iteration 60, loss = 0.0184
Iteration 80, loss = 0.0166
--- Epoch 97 / 1000
Iteration 0, loss = 0.0125
Iteration 20, loss = 0.0131
Iteration 40, loss = 0.0305
Iteration 60, loss = 0.0197
Iteration 80, loss = 0.0320
--- Epoch 98 / 1000
Iteration 0, loss = 0.0180
Iteration 20, loss = 0.0285
Iteration 40, loss = 0.0187
Iteration 60, loss = 0.0166
Iteration 80, loss = 0.0182
--- Epoch 99 / 1000
Iteration 0, loss = 0.0269
Iteration 20, loss = 0.0114
Iteration 40, loss = 0.0361
Iteration 60, loss = 0.0385
Iteration 80, loss = 0.0142
--- Epoch 100 / 1000
Iteration 0, loss = 0.0228
Iteration 20, loss = 0.0201
Iteration 40, loss = 0.0283
Iteration 60, loss = 0.0155
Iteration 80, loss = 0.0294
--- Epoch 101 / 1000
Iteration 0, loss = 0.0086
Iteration 20, loss = 0.0224
Iteration 40, loss = 0.0237
Iteration 60, loss = 0.0169
Iteration 80, loss = 0.0183
--- Epoch 102 / 1000
Iteration 0, loss = 0.0196
Iteration 20, loss = 0.0416
Iteration 40, loss = 0.0177
Iteration 60, loss = 0.0041
Iteration 80, loss = 0.0168
--- Epoch 103 / 1000
Iteration 0, loss = 0.0202
Iteration 20, loss = 0.0207
Iteration 40, loss = 0.0057
Iteration 60, loss = 0.0090
Iteration 80, loss = 0.0267
--- Epoch 104 / 1000
Iteration 0, loss = 0.0382
Iteration 20, loss = 0.0187
Iteration 40, loss = 0.0205
Iteration 60, loss = 0.0180
Iteration 80, loss = 0.0181
--- Epoch 105 / 1000
Iteration 0, loss = 0.0194
Iteration 20, loss = 0.0241
Iteration 40, loss = 0.0272
Iteration 60, loss = 0.0337
Iteration 80, loss = 0.0334
--- Epoch 106 / 1000
Iteration 0, loss = 0.0300
Iteration 20, loss = 0.0127
Iteration 40, loss = 0.0125
Iteration 60, loss = 0.0095
Iteration 80, loss = 0.0927
--- Epoch 107 / 1000
Iteration 0, loss = 0.0250
Iteration 20, loss = 0.0132
Iteration 40, loss = 0.0149
Iteration 60, loss = 0.0352
Iteration 80, loss = 0.0198
--- Epoch 108 / 1000
Iteration 0, loss = 0.0142
Iteration 20, loss = 0.0213
Iteration 40, loss = 0.0570
Iteration 60, loss = 0.0148
Iteration 80, loss = 0.0147
--- Epoch 109 / 1000
Iteration 0, loss = 0.0063
Iteration 20, loss = 0.0108
Iteration 40, loss = 0.0142
Iteration 60, loss = 0.0420
Iteration 80, loss = 0.0142
--- Epoch 110 / 1000
Iteration 0, loss = 0.0169
Iteration 20, loss = 0.0265
Iteration 40, loss = 0.0638
Iteration 60, loss = 0.0171
Iteration 80, loss = 0.0241
--- Epoch 111 / 1000
Iteration 0, loss = 0.0203
Iteration 20, loss = 0.0118
Iteration 40, loss = 0.0106
Iteration 60, loss = 0.0307
Iteration 80, loss = 0.0338
--- Epoch 112 / 1000
Iteration 0, loss = 0.0356
Iteration 20, loss = 0.0105
Iteration 40, loss = 0.0212
Iteration 60, loss = 0.0354
Iteration 80, loss = 0.0288
--- Epoch 113 / 1000
Iteration 0, loss = 0.0254
Iteration 20, loss = 0.0233
Iteration 40, loss = 0.0313
Iteration 60, loss = 0.0150
Iteration 80, loss = 0.0222
--- Epoch 114 / 1000
Iteration 0, loss = 0.0114
Iteration 20, loss = 0.0140
Iteration 40, loss = 0.0222
Iteration 60, loss = 0.0085
Iteration 80, loss = 0.0261
--- Epoch 115 / 1000
Iteration 0, loss = 0.0159
Iteration 20, loss = 0.0106
Iteration 40, loss = 0.0103
Iteration 60, loss = 0.0191
Iteration 80, loss = 0.0209
--- Epoch 116 / 1000
Iteration 0, loss = 0.0300
Iteration 20, loss = 0.0249
Iteration 40, loss = 0.0142
Iteration 60, loss = 0.0459
Iteration 80, loss = 0.0109
--- Epoch 117 / 1000
Iteration 0, loss = 0.0176
Iteration 20, loss = 0.0265
Iteration 40, loss = 0.0221
Iteration 60, loss = 0.0160
Iteration 80, loss = 0.0171
--- Epoch 118 / 1000
Iteration 0, loss = 0.0171
Iteration 20, loss = 0.0378
Iteration 40, loss = 0.0164
Iteration 60, loss = 0.0121
Iteration 80, loss = 0.0188
--- Epoch 119 / 1000
Iteration 0, loss = 0.0280
Iteration 20, loss = 0.0366
Iteration 40, loss = 0.0196
Iteration 60, loss = 0.0166
Iteration 80, loss = 0.0177
--- Epoch 120 / 1000
Iteration 0, loss = 0.0197
Iteration 20, loss = 0.0171
Iteration 40, loss = 0.0059
Iteration 60, loss = 0.0167
Iteration 80, loss = 0.0121
--- Epoch 121 / 1000
Iteration 0, loss = 0.0181
Iteration 20, loss = 0.0149
Iteration 40, loss = 0.0112
Iteration 60, loss = 0.0249
Iteration 80, loss = 0.0279
--- Epoch 122 / 1000
Iteration 0, loss = 0.0143
Iteration 20, loss = 0.0177
Iteration 40, loss = 0.0218
Iteration 60, loss = 0.0145
Iteration 80, loss = 0.0264
--- Epoch 123 / 1000
Iteration 0, loss = 0.0191
Iteration 20, loss = 0.0269
Iteration 40, loss = 0.0081
Iteration 60, loss = 0.0213
Iteration 80, loss = 0.0204
--- Epoch 124 / 1000
Iteration 0, loss = 0.0162
Iteration 20, loss = 0.0190
Iteration 40, loss = 0.0193
Iteration 60, loss = 0.0198
Iteration 80, loss = 0.0142
--- Epoch 125 / 1000
Iteration 0, loss = 0.0294
Iteration 20, loss = 0.0159
Iteration 40, loss = 0.0147
Iteration 60, loss = 0.0283
Iteration 80, loss = 0.0144
--- Epoch 126 / 1000
Iteration 0, loss = 0.0079
Iteration 20, loss = 0.0082
Iteration 40, loss = 0.0087
Iteration 60, loss = 0.0528
Iteration 80, loss = 0.0291
--- Epoch 127 / 1000
Iteration 0, loss = 0.0199
Iteration 20, loss = 0.0282
Iteration 40, loss = 0.0162
Iteration 60, loss = 0.0081
Iteration 80, loss = 0.0141
--- Epoch 128 / 1000
Iteration 0, loss = 0.0223
Iteration 20, loss = 0.0091
Iteration 40, loss = 0.0079
Iteration 60, loss = 0.0117
Iteration 80, loss = 0.0251
--- Epoch 129 / 1000
Iteration 0, loss = 0.0214
Iteration 20, loss = 0.0169
Iteration 40, loss = 0.0107
Iteration 60, loss = 0.0159
Iteration 80, loss = 0.0223
--- Epoch 130 / 1000
Iteration 0, loss = 0.0135
Iteration 20, loss = 0.0350
Iteration 40, loss = 0.0080
Iteration 60, loss = 0.0156
Iteration 80, loss = 0.0175
--- Epoch 131 / 1000
Iteration 0, loss = 0.0166
Iteration 20, loss = 0.0340
Iteration 40, loss = 0.0373
Iteration 60, loss = 0.0104
Iteration 80, loss = 0.0313
--- Epoch 132 / 1000
Iteration 0, loss = 0.0181
Iteration 20, loss = 0.0203
Iteration 40, loss = 0.0127
Iteration 60, loss = 0.0095
Iteration 80, loss = 0.0389
--- Epoch 133 / 1000
Iteration 0, loss = 0.0176
Iteration 20, loss = 0.0111
Iteration 40, loss = 0.0110
Iteration 60, loss = 0.0031
Iteration 80, loss = 0.0163
--- Epoch 134 / 1000
Iteration 0, loss = 0.0269
Iteration 20, loss = 0.0186
Iteration 40, loss = 0.0206
Iteration 60, loss = 0.0199
Iteration 80, loss = 0.0087
--- Epoch 135 / 1000
Iteration 0, loss = 0.0334
Iteration 20, loss = 0.0073
Iteration 40, loss = 0.0118
Iteration 60, loss = 0.0356
Iteration 80, loss = 0.0124
--- Epoch 136 / 1000
Iteration 0, loss = 0.0121
Iteration 20, loss = 0.0254
Iteration 40, loss = 0.0158
Iteration 60, loss = 0.0143
Iteration 80, loss = 0.0106
--- Epoch 137 / 1000
Iteration 0, loss = 0.0066
Iteration 20, loss = 0.0189
Iteration 40, loss = 0.0068
Iteration 60, loss = 0.0104
Iteration 80, loss = 0.0137
--- Epoch 138 / 1000
Iteration 0, loss = 0.0220
Iteration 20, loss = 0.0375
Iteration 40, loss = 0.0208
Iteration 60, loss = 0.0122
Iteration 80, loss = 0.0273
--- Epoch 139 / 1000
Iteration 0, loss = 0.0169
Iteration 20, loss = 0.0023
Iteration 40, loss = 0.0079
Iteration 60, loss = 0.0300
Iteration 80, loss = 0.0175
--- Epoch 140 / 1000
Iteration 0, loss = 0.0137
Iteration 20, loss = 0.0206
Iteration 40, loss = 0.0150
Iteration 60, loss = 0.0169
Iteration 80, loss = 0.0199
--- Epoch 141 / 1000
Iteration 0, loss = 0.0212
Iteration 20, loss = 0.0084
Iteration 40, loss = 0.0092
Iteration 60, loss = 0.0250
Iteration 80, loss = 0.0094
--- Epoch 142 / 1000
Iteration 0, loss = 0.0152
Iteration 20, loss = 0.0643
Iteration 40, loss = 0.0128
Iteration 60, loss = 0.0276
Iteration 80, loss = 0.0137
--- Epoch 143 / 1000
Iteration 0, loss = 0.0249
Iteration 20, loss = 0.0098
Iteration 40, loss = 0.0109
Iteration 60, loss = 0.0224
Iteration 80, loss = 0.0120
--- Epoch 144 / 1000
Iteration 0, loss = 0.0217
Iteration 20, loss = 0.0105
Iteration 40, loss = 0.0207
Iteration 60, loss = 0.0132
Iteration 80, loss = 0.0059
--- Epoch 145 / 1000
Iteration 0, loss = 0.0105
Iteration 20, loss = 0.0177
Iteration 40, loss = 0.0238
Iteration 60, loss = 0.0155
Iteration 80, loss = 0.0144
--- Epoch 146 / 1000
Iteration 0, loss = 0.0059
Iteration 20, loss = 0.0379
Iteration 40, loss = 0.0216
Iteration 60, loss = 0.0226
Iteration 80, loss = 0.0591
--- Epoch 147 / 1000
Iteration 0, loss = 0.0270
Iteration 20, loss = 0.0068
Iteration 40, loss = 0.0149
Iteration 60, loss = 0.0200
Iteration 80, loss = 0.0238
--- Epoch 148 / 1000
Iteration 0, loss = 0.0383
Iteration 20, loss = 0.0083
Iteration 40, loss = 0.0175
Iteration 60, loss = 0.0129
Iteration 80, loss = 0.0155
--- Epoch 149 / 1000
Iteration 0, loss = 0.0145
Iteration 20, loss = 0.0067
Iteration 40, loss = 0.0106
Iteration 60, loss = 0.0248
Iteration 80, loss = 0.0245
--- Epoch 150 / 1000
Iteration 0, loss = 0.0280
Iteration 20, loss = 0.0184
Iteration 40, loss = 0.0176
Iteration 60, loss = 0.0182
Iteration 80, loss = 0.0132
--- Epoch 151 / 1000
Iteration 0, loss = 0.0090
Iteration 20, loss = 0.0177
Iteration 40, loss = 0.0077
Iteration 60, loss = 0.0260
Iteration 80, loss = 0.0073
--- Epoch 152 / 1000
Iteration 0, loss = 0.0175
Iteration 20, loss = 0.0149
Iteration 40, loss = 0.0165
Iteration 60, loss = 0.0122
Iteration 80, loss = 0.0228
--- Epoch 153 / 1000
Iteration 0, loss = 0.0098
Iteration 20, loss = 0.0145
Iteration 40, loss = 0.0229
Iteration 60, loss = 0.0090
Iteration 80, loss = 0.0234
--- Epoch 154 / 1000
Iteration 0, loss = 0.0204
Iteration 20, loss = 0.0185
Iteration 40, loss = 0.0160
Iteration 60, loss = 0.0132
Iteration 80, loss = 0.0131
--- Epoch 155 / 1000
Iteration 0, loss = 0.0228
Iteration 20, loss = 0.0072
Iteration 40, loss = 0.0100
Iteration 60, loss = 0.0237
Iteration 80, loss = 0.0104
--- Epoch 156 / 1000
Iteration 0, loss = 0.0142
Iteration 20, loss = 0.0370
Iteration 40, loss = 0.0170
Iteration 60, loss = 0.0217
Iteration 80, loss = 0.0153
--- Epoch 157 / 1000
Iteration 0, loss = 0.0184
Iteration 20, loss = 0.0155
Iteration 40, loss = 0.0086
Iteration 60, loss = 0.0199
Iteration 80, loss = 0.0119
--- Epoch 158 / 1000
Iteration 0, loss = 0.0114
Iteration 20, loss = 0.0164
Iteration 40, loss = 0.0101
Iteration 60, loss = 0.0160
Iteration 80, loss = 0.0396
--- Epoch 159 / 1000
Iteration 0, loss = 0.0092
Iteration 20, loss = 0.0062
Iteration 40, loss = 0.0238
Iteration 60, loss = 0.0293
Iteration 80, loss = 0.0063
--- Epoch 160 / 1000
Iteration 0, loss = 0.0252
Iteration 20, loss = 0.0167
Iteration 40, loss = 0.0104
Iteration 60, loss = 0.0087
Iteration 80, loss = 0.0262
--- Epoch 161 / 1000
Iteration 0, loss = 0.0194
Iteration 20, loss = 0.0164
Iteration 40, loss = 0.0148
Iteration 60, loss = 0.0281
Iteration 80, loss = 0.0145
--- Epoch 162 / 1000
Iteration 0, loss = 0.0122
Iteration 20, loss = 0.0126
Iteration 40, loss = 0.0260
Iteration 60, loss = 0.0153
Iteration 80, loss = 0.0364
--- Epoch 163 / 1000
Iteration 0, loss = 0.0081
Iteration 20, loss = 0.0111
Iteration 40, loss = 0.0160
Iteration 60, loss = 0.0143
Iteration 80, loss = 0.0066
--- Epoch 164 / 1000
Iteration 0, loss = 0.0145
Iteration 20, loss = 0.0106
Iteration 40, loss = 0.0101
Iteration 60, loss = 0.0086
Iteration 80, loss = 0.0118
--- Epoch 165 / 1000
Iteration 0, loss = 0.0304
Iteration 20, loss = 0.0169
Iteration 40, loss = 0.0117
Iteration 60, loss = 0.0185
Iteration 80, loss = 0.0248
--- Epoch 166 / 1000
Iteration 0, loss = 0.0162
Iteration 20, loss = 0.0122
Iteration 40, loss = 0.0176
Iteration 60, loss = 0.0192
Iteration 80, loss = 0.0245
--- Epoch 167 / 1000
Iteration 0, loss = 0.0245
Iteration 20, loss = 0.0181
Iteration 40, loss = 0.0122
Iteration 60, loss = 0.0337
Iteration 80, loss = 0.0207
--- Epoch 168 / 1000
Iteration 0, loss = 0.0191
Iteration 20, loss = 0.0278
Iteration 40, loss = 0.0101
Iteration 60, loss = 0.0141
Iteration 80, loss = 0.0073
--- Epoch 169 / 1000
Iteration 0, loss = 0.0142
Iteration 20, loss = 0.0061
Iteration 40, loss = 0.0262
Iteration 60, loss = 0.0190
Iteration 80, loss = 0.0077
--- Epoch 170 / 1000
Iteration 0, loss = 0.0156
Iteration 20, loss = 0.0335
Iteration 40, loss = 0.0314
Iteration 60, loss = 0.0140
Iteration 80, loss = 0.0268
--- Epoch 171 / 1000
Iteration 0, loss = 0.0101
Iteration 20, loss = 0.0154
Iteration 40, loss = 0.0108
Iteration 60, loss = 0.0030
Iteration 80, loss = 0.0156
--- Epoch 172 / 1000
Iteration 0, loss = 0.0191
Iteration 20, loss = 0.0230
Iteration 40, loss = 0.0145
Iteration 60, loss = 0.0316
Iteration 80, loss = 0.0074
--- Epoch 173 / 1000
Iteration 0, loss = 0.0232
Iteration 20, loss = 0.0144
Iteration 40, loss = 0.0460
Iteration 60, loss = 0.0155
Iteration 80, loss = 0.0123
--- Epoch 174 / 1000
Iteration 0, loss = 0.0126
Iteration 20, loss = 0.0222
Iteration 40, loss = 0.0188
Iteration 60, loss = 0.0230
Iteration 80, loss = 0.0069
--- Epoch 175 / 1000
Iteration 0, loss = 0.0156
Iteration 20, loss = 0.0057
Iteration 40, loss = 0.0137
Iteration 60, loss = 0.0151
Iteration 80, loss = 0.0121
--- Epoch 176 / 1000
Iteration 0, loss = 0.0166
Iteration 20, loss = 0.0241
Iteration 40, loss = 0.0164
Iteration 60, loss = 0.0153
Iteration 80, loss = 0.0182
--- Epoch 177 / 1000
Iteration 0, loss = 0.0105
Iteration 20, loss = 0.0307
Iteration 40, loss = 0.0062
Iteration 60, loss = 0.0140
Iteration 80, loss = 0.0159
--- Epoch 178 / 1000
Iteration 0, loss = 0.0263
Iteration 20, loss = 0.0155
Iteration 40, loss = 0.0272
Iteration 60, loss = 0.0201
Iteration 80, loss = 0.0059
--- Epoch 179 / 1000
Iteration 0, loss = 0.0123
Iteration 20, loss = 0.0162
Iteration 40, loss = 0.0110
Iteration 60, loss = 0.0307
Iteration 80, loss = 0.0049
--- Epoch 180 / 1000
Iteration 0, loss = 0.0047
Iteration 20, loss = 0.0063
Iteration 40, loss = 0.0138
Iteration 60, loss = 0.0127
Iteration 80, loss = 0.0112
--- Epoch 181 / 1000
Iteration 0, loss = 0.0192
Iteration 20, loss = 0.0108
Iteration 40, loss = 0.0206
Iteration 60, loss = 0.0114
Iteration 80, loss = 0.0184
--- Epoch 182 / 1000
Iteration 0, loss = 0.0192
Iteration 20, loss = 0.0307
Iteration 40, loss = 0.0096
Iteration 60, loss = 0.0077
Iteration 80, loss = 0.0128
--- Epoch 183 / 1000
Iteration 0, loss = 0.0117
Iteration 20, loss = 0.0293
Iteration 40, loss = 0.0076
Iteration 60, loss = 0.0131
Iteration 80, loss = 0.0149
--- Epoch 184 / 1000
Iteration 0, loss = 0.0146
Iteration 20, loss = 0.0228
Iteration 40, loss = 0.0303
Iteration 60, loss = 0.0160
Iteration 80, loss = 0.0105
--- Epoch 185 / 1000
Iteration 0, loss = 0.0090
Iteration 20, loss = 0.0146
Iteration 40, loss = 0.0104
Iteration 60, loss = 0.0165
Iteration 80, loss = 0.0125
--- Epoch 186 / 1000
Iteration 0, loss = 0.0440
Iteration 20, loss = 0.0052
Iteration 40, loss = 0.0121
Iteration 60, loss = 0.0042
Iteration 80, loss = 0.0230
--- Epoch 187 / 1000
Iteration 0, loss = 0.0054
Iteration 20, loss = 0.0104
Iteration 40, loss = 0.0193
Iteration 60, loss = 0.0202
Iteration 80, loss = 0.0107
--- Epoch 188 / 1000
Iteration 0, loss = 0.0127
Iteration 20, loss = 0.0243
Iteration 40, loss = 0.0134
Iteration 60, loss = 0.0266
Iteration 80, loss = 0.0328
--- Epoch 189 / 1000
Iteration 0, loss = 0.0102
Iteration 20, loss = 0.0107
Iteration 40, loss = 0.0266
Iteration 60, loss = 0.0130
Iteration 80, loss = 0.0060
--- Epoch 190 / 1000
Iteration 0, loss = 0.0113
Iteration 20, loss = 0.0070
Iteration 40, loss = 0.0068
Iteration 60, loss = 0.0098
Iteration 80, loss = 0.0161
--- Epoch 191 / 1000
Iteration 0, loss = 0.0304
Iteration 20, loss = 0.0183
Iteration 40, loss = 0.0206
Iteration 60, loss = 0.0115
Iteration 80, loss = 0.0063
--- Epoch 192 / 1000
Iteration 0, loss = 0.0220
Iteration 20, loss = 0.0219
Iteration 40, loss = 0.0113
Iteration 60, loss = 0.0139
Iteration 80, loss = 0.0161
--- Epoch 193 / 1000
Iteration 0, loss = 0.0045
Iteration 20, loss = 0.0196
Iteration 40, loss = 0.0212
Iteration 60, loss = 0.0105
Iteration 80, loss = 0.0311
--- Epoch 194 / 1000
Iteration 0, loss = 0.0276
Iteration 20, loss = 0.0088
Iteration 40, loss = 0.0130
Iteration 60, loss = 0.0115
Iteration 80, loss = 0.0208
--- Epoch 195 / 1000
Iteration 0, loss = 0.0221
Iteration 20, loss = 0.0075
Iteration 40, loss = 0.0192
Iteration 60, loss = 0.0042
Iteration 80, loss = 0.0159
--- Epoch 196 / 1000
Iteration 0, loss = 0.0167
Iteration 20, loss = 0.0060
Iteration 40, loss = 0.0155
Iteration 60, loss = 0.0106
Iteration 80, loss = 0.0127
--- Epoch 197 / 1000
Iteration 0, loss = 0.0119
Iteration 20, loss = 0.0055
Iteration 40, loss = 0.0081
Iteration 60, loss = 0.0069
Iteration 80, loss = 0.0164
--- Epoch 198 / 1000
Iteration 0, loss = 0.0259
Iteration 20, loss = 0.0160
Iteration 40, loss = 0.0202
Iteration 60, loss = 0.0126
Iteration 80, loss = 0.0210
--- Epoch 199 / 1000
Iteration 0, loss = 0.0079
Iteration 20, loss = 0.0284
Iteration 40, loss = 0.0142
Iteration 60, loss = 0.0247
Iteration 80, loss = 0.0133
--- Epoch 200 / 1000
Iteration 0, loss = 0.0469
Iteration 20, loss = 0.0213
Iteration 40, loss = 0.0273
Iteration 60, loss = 0.0190
Iteration 80, loss = 0.0060
--- Epoch 201 / 1000
Iteration 0, loss = 0.0140
Iteration 20, loss = 0.0079
Iteration 40, loss = 0.0141
Iteration 60, loss = 0.0148
Iteration 80, loss = 0.0084
--- Epoch 202 / 1000
Iteration 0, loss = 0.0070
Iteration 20, loss = 0.0184
Iteration 40, loss = 0.0098
Iteration 60, loss = 0.0130
Iteration 80, loss = 0.0161
--- Epoch 203 / 1000
Iteration 0, loss = 0.0090
Iteration 20, loss = 0.0121
Iteration 40, loss = 0.0271
Iteration 60, loss = 0.0084
Iteration 80, loss = 0.0040
--- Epoch 204 / 1000
Iteration 0, loss = 0.0173
Iteration 20, loss = 0.0175
Iteration 40, loss = 0.0192
Iteration 60, loss = 0.0202
Iteration 80, loss = 0.0169
--- Epoch 205 / 1000
Iteration 0, loss = 0.0246
Iteration 20, loss = 0.0096
Iteration 40, loss = 0.0195
Iteration 60, loss = 0.0101
Iteration 80, loss = 0.0103
--- Epoch 206 / 1000
Iteration 0, loss = 0.0179
Iteration 20, loss = 0.0162
Iteration 40, loss = 0.0189
Iteration 60, loss = 0.0096
Iteration 80, loss = 0.0248
--- Epoch 207 / 1000
Iteration 0, loss = 0.0238
Iteration 20, loss = 0.0155
Iteration 40, loss = 0.0245
Iteration 60, loss = 0.0267
Iteration 80, loss = 0.0070
--- Epoch 208 / 1000
Iteration 0, loss = 0.0077
Iteration 20, loss = 0.0057
Iteration 40, loss = 0.0126
Iteration 60, loss = 0.0175
Iteration 80, loss = 0.0144
--- Epoch 209 / 1000
Iteration 0, loss = 0.0298
Iteration 20, loss = 0.0078
Iteration 40, loss = 0.0256
Iteration 60, loss = 0.0217
Iteration 80, loss = 0.0206
--- Epoch 210 / 1000
Iteration 0, loss = 0.0072
Iteration 20, loss = 0.0136
Iteration 40, loss = 0.0147
Iteration 60, loss = 0.0080
Iteration 80, loss = 0.0139
--- Epoch 211 / 1000
Iteration 0, loss = 0.0111
Iteration 20, loss = 0.0232
Iteration 40, loss = 0.0185
Iteration 60, loss = 0.0180
Iteration 80, loss = 0.0102
--- Epoch 212 / 1000
Iteration 0, loss = 0.0171
Iteration 20, loss = 0.0048
Iteration 40, loss = 0.0264
Iteration 60, loss = 0.0139
Iteration 80, loss = 0.0261
--- Epoch 213 / 1000
Iteration 0, loss = 0.0229
Iteration 20, loss = 0.0312
Iteration 40, loss = 0.0076
Iteration 60, loss = 0.0297
Iteration 80, loss = 0.0051
--- Epoch 214 / 1000
Iteration 0, loss = 0.0122
Iteration 20, loss = 0.0128
Iteration 40, loss = 0.0150
Iteration 60, loss = 0.0196
Iteration 80, loss = 0.0158
--- Epoch 215 / 1000
Iteration 0, loss = 0.0205
Iteration 20, loss = 0.0127
Iteration 40, loss = 0.0268
Iteration 60, loss = 0.0233
Iteration 80, loss = 0.0079
--- Epoch 216 / 1000
Iteration 0, loss = 0.0085
Iteration 20, loss = 0.0308
Iteration 40, loss = 0.0163
Iteration 60, loss = 0.0110
Iteration 80, loss = 0.0090
--- Epoch 217 / 1000
Iteration 0, loss = 0.0237
Iteration 20, loss = 0.0301
Iteration 40, loss = 0.0296
Iteration 60, loss = 0.0244
Iteration 80, loss = 0.0180
--- Epoch 218 / 1000
Iteration 0, loss = 0.0538
Iteration 20, loss = 0.0220
Iteration 40, loss = 0.0106
Iteration 60, loss = 0.0116
Iteration 80, loss = 0.0265
--- Epoch 219 / 1000
Iteration 0, loss = 0.0067
Iteration 20, loss = 0.0236
Iteration 40, loss = 0.0046
Iteration 60, loss = 0.0164
Iteration 80, loss = 0.0149
--- Epoch 220 / 1000
Iteration 0, loss = 0.0037
Iteration 20, loss = 0.0134
Iteration 40, loss = 0.0145
Iteration 60, loss = 0.0152
Iteration 80, loss = 0.0120
--- Epoch 221 / 1000
Iteration 0, loss = 0.0156
Iteration 20, loss = 0.0179
Iteration 40, loss = 0.0021
Iteration 60, loss = 0.0272
Iteration 80, loss = 0.0098
--- Epoch 222 / 1000
Iteration 0, loss = 0.0100
Iteration 20, loss = 0.0266
Iteration 40, loss = 0.0186
Iteration 60, loss = 0.0237
Iteration 80, loss = 0.0101
--- Epoch 223 / 1000
Iteration 0, loss = 0.0256
Iteration 20, loss = 0.0141
Iteration 40, loss = 0.0077
Iteration 60, loss = 0.0073
Iteration 80, loss = 0.0065
--- Epoch 224 / 1000
Iteration 0, loss = 0.0102
Iteration 20, loss = 0.0229
Iteration 40, loss = 0.0201
Iteration 60, loss = 0.0190
Iteration 80, loss = 0.0219
--- Epoch 225 / 1000
Iteration 0, loss = 0.0222
Iteration 20, loss = 0.0282
Iteration 40, loss = 0.0098
Iteration 60, loss = 0.0220
Iteration 80, loss = 0.0170
--- Epoch 226 / 1000
Iteration 0, loss = 0.0204
Iteration 20, loss = 0.0104
Iteration 40, loss = 0.0179
Iteration 60, loss = 0.0134
Iteration 80, loss = 0.0075
--- Epoch 227 / 1000
Iteration 0, loss = 0.0102
Iteration 20, loss = 0.0240
Iteration 40, loss = 0.0127
Iteration 60, loss = 0.0191
Iteration 80, loss = 0.0167
--- Epoch 228 / 1000
Iteration 0, loss = 0.0162
Iteration 20, loss = 0.0097
Iteration 40, loss = 0.0166
Iteration 60, loss = 0.0178
Iteration 80, loss = 0.0075
--- Epoch 229 / 1000
Iteration 0, loss = 0.0141
Iteration 20, loss = 0.0133
Iteration 40, loss = 0.0213
Iteration 60, loss = 0.0248
Iteration 80, loss = 0.0092
--- Epoch 230 / 1000
Iteration 0, loss = 0.0136
Iteration 20, loss = 0.0198
Iteration 40, loss = 0.0220
Iteration 60, loss = 0.0225
Iteration 80, loss = 0.0095
--- Epoch 231 / 1000
Iteration 0, loss = 0.0076
Iteration 20, loss = 0.0265
Iteration 40, loss = 0.0133
Iteration 60, loss = 0.0215
Iteration 80, loss = 0.0288
--- Epoch 232 / 1000
Iteration 0, loss = 0.0196
Iteration 20, loss = 0.0114
Iteration 40, loss = 0.0030
Iteration 60, loss = 0.0197
Iteration 80, loss = 0.0120
--- Epoch 233 / 1000
Iteration 0, loss = 0.0237
Iteration 20, loss = 0.0243
Iteration 40, loss = 0.0146
Iteration 60, loss = 0.0122
Iteration 80, loss = 0.0215
--- Epoch 234 / 1000
Iteration 0, loss = 0.0184
Iteration 20, loss = 0.0145
Iteration 40, loss = 0.0116
Iteration 60, loss = 0.0221
Iteration 80, loss = 0.0166
--- Epoch 235 / 1000
Iteration 0, loss = 0.0134
Iteration 20, loss = 0.0207
Iteration 40, loss = 0.0217
Iteration 60, loss = 0.0135
Iteration 80, loss = 0.0160
--- Epoch 236 / 1000
Iteration 0, loss = 0.0065
Iteration 20, loss = 0.0090
Iteration 40, loss = 0.0236
Iteration 60, loss = 0.0135
Iteration 80, loss = 0.0201
--- Epoch 237 / 1000
Iteration 0, loss = 0.0232
Iteration 20, loss = 0.0165
Iteration 40, loss = 0.0111
Iteration 60, loss = 0.0078
Iteration 80, loss = 0.0093
--- Epoch 238 / 1000
Iteration 0, loss = 0.0143
Iteration 20, loss = 0.0177
Iteration 40, loss = 0.0089
Iteration 60, loss = 0.0018
Iteration 80, loss = 0.0105
--- Epoch 239 / 1000
Iteration 0, loss = 0.0123
Iteration 20, loss = 0.0262
Iteration 40, loss = 0.0404
Iteration 60, loss = 0.0362
Iteration 80, loss = 0.0149
--- Epoch 240 / 1000
Iteration 0, loss = 0.0219
Iteration 20, loss = 0.0048
Iteration 40, loss = 0.0133
Iteration 60, loss = 0.0220
Iteration 80, loss = 0.0100
--- Epoch 241 / 1000
Iteration 0, loss = 0.0170
Iteration 20, loss = 0.0135
Iteration 40, loss = 0.0119
Iteration 60, loss = 0.0166
Iteration 80, loss = 0.0144
--- Epoch 242 / 1000
Iteration 0, loss = 0.0230
Iteration 20, loss = 0.0159
Iteration 40, loss = 0.0103
Iteration 60, loss = 0.0177
Iteration 80, loss = 0.0113
--- Epoch 243 / 1000
Iteration 0, loss = 0.0202
Iteration 20, loss = 0.0146
Iteration 40, loss = 0.0116
Iteration 60, loss = 0.0152
Iteration 80, loss = 0.0061
--- Epoch 244 / 1000
Iteration 0, loss = 0.0107
Iteration 20, loss = 0.0208
Iteration 40, loss = 0.0034
Iteration 60, loss = 0.0215
Iteration 80, loss = 0.0092
--- Epoch 245 / 1000
Iteration 0, loss = 0.0185
Iteration 20, loss = 0.0276
Iteration 40, loss = 0.0116
Iteration 60, loss = 0.0081
Iteration 80, loss = 0.0099
--- Epoch 246 / 1000
Iteration 0, loss = 0.0121
Iteration 20, loss = 0.0060
Iteration 40, loss = 0.0111
Iteration 60, loss = 0.0135
Iteration 80, loss = 0.0189
--- Epoch 247 / 1000
Iteration 0, loss = 0.0094
Iteration 20, loss = 0.0097
Iteration 40, loss = 0.0120
Iteration 60, loss = 0.0198
Iteration 80, loss = 0.0210
--- Epoch 248 / 1000
Iteration 0, loss = 0.0135
Iteration 20, loss = 0.0148
Iteration 40, loss = 0.0134
Iteration 60, loss = 0.0136
Iteration 80, loss = 0.0217
--- Epoch 249 / 1000
Iteration 0, loss = 0.0266
Iteration 20, loss = 0.0092
Iteration 40, loss = 0.0198
Iteration 60, loss = 0.0244
Iteration 80, loss = 0.0160
--- Epoch 250 / 1000
Iteration 0, loss = 0.0081
Iteration 20, loss = 0.0201
Iteration 40, loss = 0.0355
Iteration 60, loss = 0.0119
Iteration 80, loss = 0.0152
--- Epoch 251 / 1000
Iteration 0, loss = 0.0156
Iteration 20, loss = 0.0283
Iteration 40, loss = 0.0159
Iteration 60, loss = 0.0095
Iteration 80, loss = 0.0103
--- Epoch 252 / 1000
Iteration 0, loss = 0.0180
Iteration 20, loss = 0.0150
Iteration 40, loss = 0.0175
Iteration 60, loss = 0.0124
Iteration 80, loss = 0.0175
--- Epoch 253 / 1000
Iteration 0, loss = 0.0159
Iteration 20, loss = 0.0063
Iteration 40, loss = 0.0082
Iteration 60, loss = 0.0112
Iteration 80, loss = 0.0252
--- Epoch 254 / 1000
Iteration 0, loss = 0.0113
Iteration 20, loss = 0.0120
Iteration 40, loss = 0.0081
Iteration 60, loss = 0.0157
Iteration 80, loss = 0.0092
--- Epoch 255 / 1000
Iteration 0, loss = 0.0236
Iteration 20, loss = 0.0068
Iteration 40, loss = 0.0261
Iteration 60, loss = 0.0129
Iteration 80, loss = 0.0078
--- Epoch 256 / 1000
Iteration 0, loss = 0.0161
Iteration 20, loss = 0.0151
Iteration 40, loss = 0.0138
Iteration 60, loss = 0.0181
Iteration 80, loss = 0.0109
--- Epoch 257 / 1000
Iteration 0, loss = 0.0181
Iteration 20, loss = 0.0098
Iteration 40, loss = 0.0205
Iteration 60, loss = 0.0290
Iteration 80, loss = 0.0107
--- Epoch 258 / 1000
Iteration 0, loss = 0.0097
Iteration 20, loss = 0.0116
Iteration 40, loss = 0.0137
Iteration 60, loss = 0.0120
Iteration 80, loss = 0.0153
--- Epoch 259 / 1000
Iteration 0, loss = 0.0135
Iteration 20, loss = 0.0253
Iteration 40, loss = 0.0175
Iteration 60, loss = 0.0205
Iteration 80, loss = 0.0199
--- Epoch 260 / 1000
Iteration 0, loss = 0.0098
Iteration 20, loss = 0.0286
Iteration 40, loss = 0.0129
Iteration 60, loss = 0.0216
Iteration 80, loss = 0.0232
--- Epoch 261 / 1000
Iteration 0, loss = 0.0125
Iteration 20, loss = 0.0155
Iteration 40, loss = 0.0080
Iteration 60, loss = 0.0039
Iteration 80, loss = 0.0131
--- Epoch 262 / 1000
Iteration 0, loss = 0.0050
Iteration 20, loss = 0.0181
Iteration 40, loss = 0.0133
Iteration 60, loss = 0.0109
Iteration 80, loss = 0.0137
--- Epoch 263 / 1000
Iteration 0, loss = 0.0203
Iteration 20, loss = 0.0042
Iteration 40, loss = 0.0337
Iteration 60, loss = 0.0099
Iteration 80, loss = 0.0056
--- Epoch 264 / 1000
Iteration 0, loss = 0.0312
Iteration 20, loss = 0.0090
Iteration 40, loss = 0.0168
Iteration 60, loss = 0.0228
Iteration 80, loss = 0.0194
--- Epoch 265 / 1000
Iteration 0, loss = 0.0061
Iteration 20, loss = 0.0088
Iteration 40, loss = 0.0135
Iteration 60, loss = 0.0069
Iteration 80, loss = 0.0236
--- Epoch 266 / 1000
Iteration 0, loss = 0.0155
Iteration 20, loss = 0.0186
Iteration 40, loss = 0.0077
Iteration 60, loss = 0.0117
Iteration 80, loss = 0.0111
--- Epoch 267 / 1000
Iteration 0, loss = 0.0168
Iteration 20, loss = 0.0113
Iteration 40, loss = 0.0070
Iteration 60, loss = 0.0098
Iteration 80, loss = 0.0048
--- Epoch 268 / 1000
Iteration 0, loss = 0.0127
Iteration 20, loss = 0.0193
Iteration 40, loss = 0.0077
Iteration 60, loss = 0.0031
Iteration 80, loss = 0.0277
--- Epoch 269 / 1000
Iteration 0, loss = 0.0232
Iteration 20, loss = 0.0270
Iteration 40, loss = 0.0139
Iteration 60, loss = 0.0187
Iteration 80, loss = 0.0129
--- Epoch 270 / 1000
Iteration 0, loss = 0.0186
Iteration 20, loss = 0.0209
Iteration 40, loss = 0.0183
Iteration 60, loss = 0.0149
Iteration 80, loss = 0.0120
--- Epoch 271 / 1000
Iteration 0, loss = 0.0064
Iteration 20, loss = 0.0201
Iteration 40, loss = 0.0128
Iteration 60, loss = 0.0075
Iteration 80, loss = 0.0118
--- Epoch 272 / 1000
Iteration 0, loss = 0.0131
Iteration 20, loss = 0.0114
Iteration 40, loss = 0.0208
Iteration 60, loss = 0.0085
Iteration 80, loss = 0.0174
--- Epoch 273 / 1000
Iteration 0, loss = 0.0133
Iteration 20, loss = 0.0131
Iteration 40, loss = 0.0134
Iteration 60, loss = 0.0183
Iteration 80, loss = 0.0300
--- Epoch 274 / 1000
Iteration 0, loss = 0.0212
Iteration 20, loss = 0.0179
Iteration 40, loss = 0.0094
Iteration 60, loss = 0.0055
Iteration 80, loss = 0.0056
--- Epoch 275 / 1000
Iteration 0, loss = 0.0126
Iteration 20, loss = 0.0252
Iteration 40, loss = 0.0075
Iteration 60, loss = 0.0063
Iteration 80, loss = 0.0070
--- Epoch 276 / 1000
Iteration 0, loss = 0.0074
Iteration 20, loss = 0.0165
Iteration 40, loss = 0.0051
Iteration 60, loss = 0.0215
Iteration 80, loss = 0.0168
--- Epoch 277 / 1000
Iteration 0, loss = 0.0131
Iteration 20, loss = 0.0084
Iteration 40, loss = 0.0260
Iteration 60, loss = 0.0117
Iteration 80, loss = 0.0129
--- Epoch 278 / 1000
Iteration 0, loss = 0.0178
Iteration 20, loss = 0.0166
Iteration 40, loss = 0.0138
Iteration 60, loss = 0.0350
Iteration 80, loss = 0.0546
--- Epoch 279 / 1000
Iteration 0, loss = 0.0159
Iteration 20, loss = 0.0236
Iteration 40, loss = 0.0084
Iteration 60, loss = 0.0017
Iteration 80, loss = 0.0077
--- Epoch 280 / 1000
Iteration 0, loss = 0.0335
Iteration 20, loss = 0.0241
Iteration 40, loss = 0.0107
Iteration 60, loss = 0.0065
Iteration 80, loss = 0.0282
--- Epoch 281 / 1000
Iteration 0, loss = 0.0106
Iteration 20, loss = 0.0088
Iteration 40, loss = 0.0098
Iteration 60, loss = 0.0132
Iteration 80, loss = 0.0224
--- Epoch 282 / 1000
Iteration 0, loss = 0.0229
Iteration 20, loss = 0.0084
Iteration 40, loss = 0.0165
Iteration 60, loss = 0.0221
Iteration 80, loss = 0.0082
--- Epoch 283 / 1000
Iteration 0, loss = 0.0107
Iteration 20, loss = 0.0143
Iteration 40, loss = 0.0193
Iteration 60, loss = 0.0174
Iteration 80, loss = 0.0182
--- Epoch 284 / 1000
Iteration 0, loss = 0.0372
Iteration 20, loss = 0.0060
Iteration 40, loss = 0.0277
Iteration 60, loss = 0.0160
Iteration 80, loss = 0.0079
--- Epoch 285 / 1000
Iteration 0, loss = 0.0237
Iteration 20, loss = 0.0103
Iteration 40, loss = 0.0080
Iteration 60, loss = 0.0135
Iteration 80, loss = 0.0179
--- Epoch 286 / 1000
Iteration 0, loss = 0.0108
Iteration 20, loss = 0.0209
Iteration 40, loss = 0.0061
Iteration 60, loss = 0.0247
Iteration 80, loss = 0.0087
--- Epoch 287 / 1000
Iteration 0, loss = 0.0344
Iteration 20, loss = 0.0140
Iteration 40, loss = 0.0111
Iteration 60, loss = 0.0325
Iteration 80, loss = 0.0127
--- Epoch 288 / 1000
Iteration 0, loss = 0.0402
Iteration 20, loss = 0.0140
Iteration 40, loss = 0.0071
Iteration 60, loss = 0.0084
Iteration 80, loss = 0.0080
--- Epoch 289 / 1000
Iteration 0, loss = 0.0147
Iteration 20, loss = 0.0096
Iteration 40, loss = 0.0076
Iteration 60, loss = 0.0166
Iteration 80, loss = 0.0152
--- Epoch 290 / 1000
Iteration 0, loss = 0.0172
Iteration 20, loss = 0.0139
Iteration 40, loss = 0.0131
Iteration 60, loss = 0.0089
Iteration 80, loss = 0.0154
--- Epoch 291 / 1000
Iteration 0, loss = 0.0051
Iteration 20, loss = 0.0040
Iteration 40, loss = 0.0159
Iteration 60, loss = 0.0093
Iteration 80, loss = 0.0168
--- Epoch 292 / 1000
Iteration 0, loss = 0.0157
Iteration 20, loss = 0.0188
Iteration 40, loss = 0.0087
Iteration 60, loss = 0.0224
Iteration 80, loss = 0.0142
--- Epoch 293 / 1000
Iteration 0, loss = 0.0289
Iteration 20, loss = 0.0259
Iteration 40, loss = 0.0168
Iteration 60, loss = 0.0370
Iteration 80, loss = 0.0158
--- Epoch 294 / 1000
Iteration 0, loss = 0.0210
Iteration 20, loss = 0.0101
Iteration 40, loss = 0.0138
Iteration 60, loss = 0.0247
Iteration 80, loss = 0.0246
--- Epoch 295 / 1000
Iteration 0, loss = 0.0084
Iteration 20, loss = 0.0176
Iteration 40, loss = 0.0143
Iteration 60, loss = 0.0173
Iteration 80, loss = 0.0089
--- Epoch 296 / 1000
Iteration 0, loss = 0.0162
Iteration 20, loss = 0.0103
Iteration 40, loss = 0.0023
Iteration 60, loss = 0.0154
Iteration 80, loss = 0.0064
--- Epoch 297 / 1000
Iteration 0, loss = 0.0092
Iteration 20, loss = 0.0062
Iteration 40, loss = 0.0152
Iteration 60, loss = 0.0095
Iteration 80, loss = 0.0119
--- Epoch 298 / 1000
Iteration 0, loss = 0.0117
Iteration 20, loss = 0.0186
Iteration 40, loss = 0.0142
Iteration 60, loss = 0.0302
Iteration 80, loss = 0.0127
--- Epoch 299 / 1000
Iteration 0, loss = 0.0115
Iteration 20, loss = 0.0062
Iteration 40, loss = 0.0046
Iteration 60, loss = 0.0201
Iteration 80, loss = 0.0175
--- Epoch 300 / 1000
Iteration 0, loss = 0.0141
Iteration 20, loss = 0.0122
Iteration 40, loss = 0.0202
Iteration 60, loss = 0.0109
Iteration 80, loss = 0.0190
--- Epoch 301 / 1000
Iteration 0, loss = 0.0108
Iteration 20, loss = 0.0136
Iteration 40, loss = 0.0231
Iteration 60, loss = 0.0140
Iteration 80, loss = 0.0142
--- Epoch 302 / 1000
Iteration 0, loss = 0.0133
Iteration 20, loss = 0.0074
Iteration 40, loss = 0.0154
Iteration 60, loss = 0.0100
Iteration 80, loss = 0.0137
--- Epoch 303 / 1000
Iteration 0, loss = 0.0194
Iteration 20, loss = 0.0133
Iteration 40, loss = 0.0042
Iteration 60, loss = 0.0049
Iteration 80, loss = 0.0111
--- Epoch 304 / 1000
Iteration 0, loss = 0.0123
Iteration 20, loss = 0.0386
Iteration 40, loss = 0.0202
Iteration 60, loss = 0.0135
Iteration 80, loss = 0.0303
--- Epoch 305 / 1000
Iteration 0, loss = 0.0163
Iteration 20, loss = 0.0195
Iteration 40, loss = 0.0109
Iteration 60, loss = 0.0187
Iteration 80, loss = 0.0164
--- Epoch 306 / 1000
Iteration 0, loss = 0.0115
Iteration 20, loss = 0.0150
Iteration 40, loss = 0.0163
Iteration 60, loss = 0.0104
Iteration 80, loss = 0.0060
--- Epoch 307 / 1000
Iteration 0, loss = 0.0050
Iteration 20, loss = 0.0059
Iteration 40, loss = 0.0130
Iteration 60, loss = 0.0135
Iteration 80, loss = 0.0025
--- Epoch 308 / 1000
Iteration 0, loss = 0.0272
Iteration 20, loss = 0.0133
Iteration 40, loss = 0.0147
Iteration 60, loss = 0.0144
Iteration 80, loss = 0.0179
--- Epoch 309 / 1000
Iteration 0, loss = 0.0277
Iteration 20, loss = 0.0095
Iteration 40, loss = 0.0181
Iteration 60, loss = 0.0100
Iteration 80, loss = 0.0047
--- Epoch 310 / 1000
Iteration 0, loss = 0.0117
Iteration 20, loss = 0.0135
Iteration 40, loss = 0.0144
Iteration 60, loss = 0.0087
Iteration 80, loss = 0.0205
--- Epoch 311 / 1000
Iteration 0, loss = 0.0071
Iteration 20, loss = 0.0058
Iteration 40, loss = 0.0137
Iteration 60, loss = 0.0172
Iteration 80, loss = 0.0197
--- Epoch 312 / 1000
Iteration 0, loss = 0.0092
Iteration 20, loss = 0.0017
Iteration 40, loss = 0.0057
Iteration 60, loss = 0.0113
Iteration 80, loss = 0.0130
--- Epoch 313 / 1000
Iteration 0, loss = 0.0190
Iteration 20, loss = 0.0161
Iteration 40, loss = 0.0208
Iteration 60, loss = 0.0214
Iteration 80, loss = 0.0053
--- Epoch 314 / 1000
Iteration 0, loss = 0.0145
Iteration 20, loss = 0.0106
Iteration 40, loss = 0.0161
Iteration 60, loss = 0.0202
Iteration 80, loss = 0.0238
--- Epoch 315 / 1000
Iteration 0, loss = 0.0204
Iteration 20, loss = 0.0139
Iteration 40, loss = 0.0303
Iteration 60, loss = 0.0055
Iteration 80, loss = 0.0205
--- Epoch 316 / 1000
Iteration 0, loss = 0.0221
Iteration 20, loss = 0.0139
Iteration 40, loss = 0.0194
Iteration 60, loss = 0.0120
Iteration 80, loss = 0.0189
--- Epoch 317 / 1000
Iteration 0, loss = 0.0107
Iteration 20, loss = 0.0136
Iteration 40, loss = 0.0045
Iteration 60, loss = 0.0232
Iteration 80, loss = 0.0214
--- Epoch 318 / 1000
Iteration 0, loss = 0.0144
Iteration 20, loss = 0.0048
Iteration 40, loss = 0.0104
Iteration 60, loss = 0.0184
Iteration 80, loss = 0.0049
--- Epoch 319 / 1000
Iteration 0, loss = 0.0053
Iteration 20, loss = 0.0112
Iteration 40, loss = 0.0109
Iteration 60, loss = 0.0175
Iteration 80, loss = 0.0059
--- Epoch 320 / 1000
Iteration 0, loss = 0.0108
Iteration 20, loss = 0.0224
Iteration 40, loss = 0.0040
Iteration 60, loss = 0.0093
Iteration 80, loss = 0.0204
--- Epoch 321 / 1000
Iteration 0, loss = 0.0277
Iteration 20, loss = 0.0209
Iteration 40, loss = 0.0225
Iteration 60, loss = 0.0149
Iteration 80, loss = 0.0096
--- Epoch 322 / 1000
Iteration 0, loss = 0.0149
Iteration 20, loss = 0.0179
Iteration 40, loss = 0.0125
Iteration 60, loss = 0.0180
Iteration 80, loss = 0.0133
--- Epoch 323 / 1000
Iteration 0, loss = 0.0040
Iteration 20, loss = 0.0093
Iteration 40, loss = 0.0132
Iteration 60, loss = 0.0156
Iteration 80, loss = 0.0084
--- Epoch 324 / 1000
Iteration 0, loss = 0.0145
Iteration 20, loss = 0.0192
Iteration 40, loss = 0.0262
Iteration 60, loss = 0.0052
Iteration 80, loss = 0.0457
--- Epoch 325 / 1000
Iteration 0, loss = 0.0150
Iteration 20, loss = 0.0275
Iteration 40, loss = 0.0096
Iteration 60, loss = 0.0222
Iteration 80, loss = 0.0145
--- Epoch 326 / 1000
Iteration 0, loss = 0.0054
Iteration 20, loss = 0.0111
Iteration 40, loss = 0.0106
Iteration 60, loss = 0.0104
Iteration 80, loss = 0.0210
--- Epoch 327 / 1000
Iteration 0, loss = 0.0104
Iteration 20, loss = 0.0066
Iteration 40, loss = 0.0232
Iteration 60, loss = 0.0125
Iteration 80, loss = 0.0197
--- Epoch 328 / 1000
Iteration 0, loss = 0.0551
Iteration 20, loss = 0.0104
Iteration 40, loss = 0.0192
Iteration 60, loss = 0.0187
Iteration 80, loss = 0.0150
--- Epoch 329 / 1000
Iteration 0, loss = 0.0038
Iteration 20, loss = 0.0173
Iteration 40, loss = 0.0093
Iteration 60, loss = 0.0243
Iteration 80, loss = 0.0179
--- Epoch 330 / 1000
Iteration 0, loss = 0.0157
Iteration 20, loss = 0.0103
Iteration 40, loss = 0.0040
Iteration 60, loss = 0.0087
Iteration 80, loss = 0.0104
--- Epoch 331 / 1000
Iteration 0, loss = 0.0118
Iteration 20, loss = 0.0197
Iteration 40, loss = 0.0104
Iteration 60, loss = 0.0175
Iteration 80, loss = 0.0085
--- Epoch 332 / 1000
Iteration 0, loss = 0.0096
Iteration 20, loss = 0.0308
Iteration 40, loss = 0.0318
Iteration 60, loss = 0.0240
Iteration 80, loss = 0.0181
--- Epoch 333 / 1000
Iteration 0, loss = 0.0103
Iteration 20, loss = 0.0139
Iteration 40, loss = 0.0206
Iteration 60, loss = 0.0134
Iteration 80, loss = 0.0115
--- Epoch 334 / 1000
Iteration 0, loss = 0.0307
Iteration 20, loss = 0.0131
Iteration 40, loss = 0.0375
Iteration 60, loss = 0.0186
Iteration 80, loss = 0.0177
--- Epoch 335 / 1000
Iteration 0, loss = 0.0137
Iteration 20, loss = 0.0307
Iteration 40, loss = 0.0086
Iteration 60, loss = 0.0098
Iteration 80, loss = 0.0162
--- Epoch 336 / 1000
Iteration 0, loss = 0.0058
Iteration 20, loss = 0.0066
Iteration 40, loss = 0.0100
Iteration 60, loss = 0.0080
Iteration 80, loss = 0.0070
--- Epoch 337 / 1000
Iteration 0, loss = 0.0133
Iteration 20, loss = 0.0115
Iteration 40, loss = 0.0277
Iteration 60, loss = 0.0148
Iteration 80, loss = 0.0099
--- Epoch 338 / 1000
Iteration 0, loss = 0.0063
Iteration 20, loss = 0.0103
Iteration 40, loss = 0.0185
Iteration 60, loss = 0.0101
Iteration 80, loss = 0.0191
--- Epoch 339 / 1000
Iteration 0, loss = 0.0121
Iteration 20, loss = 0.0073
Iteration 40, loss = 0.0143
Iteration 60, loss = 0.0089
Iteration 80, loss = 0.0168
--- Epoch 340 / 1000
Iteration 0, loss = 0.0194
Iteration 20, loss = 0.0314
Iteration 40, loss = 0.0157
Iteration 60, loss = 0.0087
Iteration 80, loss = 0.0079
--- Epoch 341 / 1000
Iteration 0, loss = 0.0134
Iteration 20, loss = 0.0110
Iteration 40, loss = 0.0105
Iteration 60, loss = 0.0073
Iteration 80, loss = 0.0203
--- Epoch 342 / 1000
Iteration 0, loss = 0.0143
Iteration 20, loss = 0.0056
Iteration 40, loss = 0.0366
Iteration 60, loss = 0.0109
Iteration 80, loss = 0.0095
--- Epoch 343 / 1000
Iteration 0, loss = 0.0134
Iteration 20, loss = 0.0134
Iteration 40, loss = 0.0051
Iteration 60, loss = 0.0065
Iteration 80, loss = 0.0122
--- Epoch 344 / 1000
Iteration 0, loss = 0.0079
Iteration 20, loss = 0.0182
Iteration 40, loss = 0.0919
Iteration 60, loss = 0.0258
Iteration 80, loss = 0.0122
--- Epoch 345 / 1000
Iteration 0, loss = 0.0110
Iteration 20, loss = 0.0128
Iteration 40, loss = 0.0221
Iteration 60, loss = 0.0107
Iteration 80, loss = 0.0086
--- Epoch 346 / 1000
Iteration 0, loss = 0.0197
Iteration 20, loss = 0.0131
Iteration 40, loss = 0.0024
Iteration 60, loss = 0.0058
Iteration 80, loss = 0.0093
--- Epoch 347 / 1000
Iteration 0, loss = 0.0179
Iteration 20, loss = 0.0179
Iteration 40, loss = 0.0079
Iteration 60, loss = 0.0202
Iteration 80, loss = 0.0127
--- Epoch 348 / 1000
Iteration 0, loss = 0.0138
Iteration 20, loss = 0.0111
Iteration 40, loss = 0.0160
Iteration 60, loss = 0.0112
Iteration 80, loss = 0.0186
--- Epoch 349 / 1000
Iteration 0, loss = 0.0147
Iteration 20, loss = 0.0087
Iteration 40, loss = 0.0120
Iteration 60, loss = 0.0204
Iteration 80, loss = 0.0260
--- Epoch 350 / 1000
Iteration 0, loss = 0.0090
Iteration 20, loss = 0.0325
Iteration 40, loss = 0.0077
Iteration 60, loss = 0.0124
Iteration 80, loss = 0.0147
--- Epoch 351 / 1000
Iteration 0, loss = 0.0111
Iteration 20, loss = 0.0225
Iteration 40, loss = 0.0056
Iteration 60, loss = 0.0062
Iteration 80, loss = 0.0057
--- Epoch 352 / 1000
Iteration 0, loss = 0.0138
Iteration 20, loss = 0.0071
Iteration 40, loss = 0.0096
Iteration 60, loss = 0.0095
Iteration 80, loss = 0.0064
--- Epoch 353 / 1000
Iteration 0, loss = 0.0169
Iteration 20, loss = 0.0312
Iteration 40, loss = 0.0237
Iteration 60, loss = 0.0281
Iteration 80, loss = 0.0115
--- Epoch 354 / 1000
Iteration 0, loss = 0.0140
Iteration 20, loss = 0.0017
Iteration 40, loss = 0.0072
Iteration 60, loss = 0.0179
Iteration 80, loss = 0.0218
--- Epoch 355 / 1000
Iteration 0, loss = 0.0191
Iteration 20, loss = 0.0102
Iteration 40, loss = 0.0063
Iteration 60, loss = 0.0126
Iteration 80, loss = 0.0075
--- Epoch 356 / 1000
Iteration 0, loss = 0.0224
Iteration 20, loss = 0.0302
Iteration 40, loss = 0.0152
Iteration 60, loss = 0.0347
Iteration 80, loss = 0.0147
--- Epoch 357 / 1000
Iteration 0, loss = 0.0143
Iteration 20, loss = 0.0104
Iteration 40, loss = 0.0149
Iteration 60, loss = 0.0077
Iteration 80, loss = 0.0105
--- Epoch 358 / 1000
Iteration 0, loss = 0.0072
Iteration 20, loss = 0.0111
Iteration 40, loss = 0.0104
Iteration 60, loss = 0.0211
Iteration 80, loss = 0.0191
--- Epoch 359 / 1000
Iteration 0, loss = 0.0115
Iteration 20, loss = 0.0026
Iteration 40, loss = 0.0130
Iteration 60, loss = 0.0262
Iteration 80, loss = 0.0050
--- Epoch 360 / 1000
Iteration 0, loss = 0.0115
Iteration 20, loss = 0.0189
Iteration 40, loss = 0.0087
Iteration 60, loss = 0.0148
Iteration 80, loss = 0.0162
--- Epoch 361 / 1000
Iteration 0, loss = 0.0078
Iteration 20, loss = 0.0090
Iteration 40, loss = 0.0332
Iteration 60, loss = 0.0302
Iteration 80, loss = 0.0122
--- Epoch 362 / 1000
Iteration 0, loss = 0.0156
Iteration 20, loss = 0.0143
Iteration 40, loss = 0.0109
Iteration 60, loss = 0.0219
Iteration 80, loss = 0.0073
--- Epoch 363 / 1000
Iteration 0, loss = 0.0153
Iteration 20, loss = 0.0123
Iteration 40, loss = 0.0296
Iteration 60, loss = 0.0104
Iteration 80, loss = 0.0233
--- Epoch 364 / 1000
Iteration 0, loss = 0.0101
Iteration 20, loss = 0.0125
Iteration 40, loss = 0.0040
Iteration 60, loss = 0.0144
Iteration 80, loss = 0.0089
--- Epoch 365 / 1000
Iteration 0, loss = 0.0114
Iteration 20, loss = 0.0070
Iteration 40, loss = 0.0116
Iteration 60, loss = 0.0247
Iteration 80, loss = 0.0143
--- Epoch 366 / 1000
Iteration 0, loss = 0.0148
Iteration 20, loss = 0.0129
Iteration 40, loss = 0.0164
Iteration 60, loss = 0.0129
Iteration 80, loss = 0.0155
--- Epoch 367 / 1000
Iteration 0, loss = 0.0158
Iteration 20, loss = 0.0101
Iteration 40, loss = 0.0050
Iteration 60, loss = 0.0122
Iteration 80, loss = 0.0104
--- Epoch 368 / 1000
Iteration 0, loss = 0.0130
Iteration 20, loss = 0.0126
Iteration 40, loss = 0.0119
Iteration 60, loss = 0.0102
Iteration 80, loss = 0.0045
--- Epoch 369 / 1000
Iteration 0, loss = 0.0053
Iteration 20, loss = 0.0184
Iteration 40, loss = 0.0068
Iteration 60, loss = 0.0142
Iteration 80, loss = 0.0065
--- Epoch 370 / 1000
Iteration 0, loss = 0.0199
Iteration 20, loss = 0.0084
Iteration 40, loss = 0.0132
Iteration 60, loss = 0.0199
Iteration 80, loss = 0.0205
--- Epoch 371 / 1000
Iteration 0, loss = 0.0134
Iteration 20, loss = 0.0108
Iteration 40, loss = 0.0184
Iteration 60, loss = 0.0104
Iteration 80, loss = 0.0164
--- Epoch 372 / 1000
Iteration 0, loss = 0.0159
Iteration 20, loss = 0.0121
Iteration 40, loss = 0.0291
Iteration 60, loss = 0.0209
Iteration 80, loss = 0.0187
--- Epoch 373 / 1000
Iteration 0, loss = 0.0093
Iteration 20, loss = 0.0096
Iteration 40, loss = 0.0178
Iteration 60, loss = 0.0147
Iteration 80, loss = 0.0225
--- Epoch 374 / 1000
Iteration 0, loss = 0.0045
Iteration 20, loss = 0.0034
Iteration 40, loss = 0.0076
Iteration 60, loss = 0.0064
Iteration 80, loss = 0.0041
--- Epoch 375 / 1000
Iteration 0, loss = 0.0222
Iteration 20, loss = 0.0768
Iteration 40, loss = 0.0165
Iteration 60, loss = 0.0192
Iteration 80, loss = 0.0051
---------------------------------------------------------------------------
KeyboardInterrupt                         Traceback (most recent call last)
<ipython-input-215-506d6bf61503> in <module>
----> 1 train(model7, optimizer, epochs=1000, x_train=data["X_train_class"],  y_train=data["y_train_class"], criterion=custom_loss)

<ipython-input-164-7b479c5968e4> in train(model, optimizer, epochs, x_train, y_train, criterion)
     38             # This is the backwards pass: compute the gradient of the loss with
     39             # respect to each  parameter of the model.
---> 40             loss.backward()
     41 
     42             # Actually update the parameters of the model using the gradients

/opt/anaconda3/envs/cs682/lib/python3.6/site-packages/torch/tensor.py in backward(self, gradient, retain_graph, create_graph)
    183                 products. Defaults to ``False``.
    184         """
--> 185         torch.autograd.backward(self, gradient, retain_graph, create_graph)
    186 
    187     def register_hook(self, hook):

/opt/anaconda3/envs/cs682/lib/python3.6/site-packages/torch/autograd/__init__.py in backward(tensors, grad_tensors, retain_graph, create_graph, grad_variables)
    125     Variable._execution_engine.run_backward(
    126         tensors, grad_tensors, retain_graph, create_graph,
--> 127         allow_unreachable=True)  # allow_unreachable flag
    128 
    129 

KeyboardInterrupt: 
In [7]:
# Evaluate model7 on the entries stored under the "X_test_ship" / "y_test_ship" keys of `data`.
# NOTE(review): in the recorded run this cell raised
# "NameError: name 'testModel' is not defined" — the cell defining testModel
# had not been executed in that kernel session. Run the defining cell (and the
# cells that build model7 and these data entries) first — TODO confirm where they live.
testModel(model7, x_test=data["X_test_ship"], y_test=data["y_test_ship"])
---------------------------------------------------------------------------
NameError                                 Traceback (most recent call last)
<ipython-input-7-655c38579b03> in <module>
----> 1 testModel(model7, x_test=data["X_test_ship"], y_test=data["y_test_ship"])

NameError: name 'testModel' is not defined
In [559]:
class ConvNet3(nn.Module):
    """Convolutional encoder-decoder mapping one input channel to three output channels.

    Encoder: four 3x3 convolutions (1 -> 32 -> 64 -> 128 -> 128 channels), the
    last three with stride 2, each followed by batch normalisation and ReLU.
    Decoder: three rounds of 2x bilinear upsampling followed by a 3x3
    convolution (128 -> 64 -> 32 -> 3 channels). The first two decoder
    convolutions use batch normalisation + ReLU; the last one is squashed with
    ``tanh``, so every output value lies in [-1, 1].

    The three stride-2 convolutions shrink each spatial dimension by 8x and
    the three upsampling steps grow it by 8x, so the output has the same
    height/width as the input whenever both are divisible by 8.

    Attributes:
        epochsTrained: counter initialised to 0. It is never modified inside
            this class.
    """

    def __init__(self):
        super().__init__()
        self.epochsTrained = 0

        # NOTE: attribute names and registration order are kept stable on
        # purpose; they define the state_dict keys and the order of
        # model.parameters().
        self.batchnorm1 = nn.BatchNorm2d(32)
        self.batchnorm2 = nn.BatchNorm2d(64)
        self.batchnorm3 = nn.BatchNorm2d(128)
        self.batchnorm4 = nn.BatchNorm2d(128)
        self.batchnorm5 = nn.BatchNorm2d(64)
        self.batchnorm6 = nn.BatchNorm2d(32)

        # align_corners=False is the documented default for bilinear mode;
        # spelling it out keeps the numerics unchanged while avoiding the
        # "default upsampling behavior ... has changed" warning on every call.
        self.upsample = nn.Upsample(scale_factor=2, mode='bilinear',
                                    align_corners=False)

        self.conv1 = nn.Conv2d(1, 32, kernel_size=3, padding=1)
        self.conv2 = nn.Conv2d(32, 64, kernel_size=3, stride=2, padding=1)
        self.conv3 = nn.Conv2d(64, 128, kernel_size=3, stride=2, padding=1)
        self.conv4 = nn.Conv2d(128, 128, kernel_size=3, stride=2, padding=1)
        self.conv5 = nn.Conv2d(128, 64, kernel_size=3, padding=1)
        self.conv6 = nn.Conv2d(64, 32, kernel_size=3, padding=1)
        self.conv7 = nn.Conv2d(32, 3, kernel_size=3, padding=1)

    def forward(self, x):
        """Run the encoder-decoder on one image or on a batch of images.

        Args:
            x: tensor of shape ``(C, H, W)`` (single image) or
                ``(N, C, H, W)`` (batch). Only channel 0 is fed to the
                network; any further channels are ignored.

        Returns:
            Tensor of shape ``(N, 3, H', W')`` with values in [-1, 1], where
            ``N == 1`` for a single-image input and ``H' == H``, ``W' == W``
            when ``H`` and ``W`` are divisible by 8.

        Raises:
            ValueError: if ``x`` is neither 3-D nor 4-D.
        """
        if x.dim() == 3:
            # Single image: add the batch axis, giving (1, C, H, W).
            x = x.unsqueeze(0)
        elif x.dim() != 4:
            raise ValueError(
                "ConvNet3 expects a (C, H, W) or (N, C, H, W) tensor, got %d dimensions"
                % x.dim()
            )
        # Keep channel 0 only; slicing with :1 preserves the channel axis so
        # the result is (N, 1, H, W), which is what conv1 expects.
        x = x[:, :1]

        # Encoder
        scores = F.relu(self.batchnorm1(self.conv1(x)))
        scores = F.relu(self.batchnorm2(self.conv2(scores)))
        scores = F.relu(self.batchnorm3(self.conv3(scores)))
        scores = F.relu(self.batchnorm4(self.conv4(scores)))

        # Decoder
        scores = self.upsample(scores)
        scores = F.relu(self.batchnorm5(self.conv5(scores)))
        scores = self.upsample(scores)
        scores = F.relu(self.batchnorm6(self.conv6(scores)))
        scores = self.upsample(scores)
        scores = torch.tanh(self.conv7(scores))

        return scores
In [560]:
# Build a fresh ConvNet3 and an SGD optimizer over its parameters.
# The learning rate is kept in a named variable so it can be tuned in one place.
learning_rate = 5e-2
model8 = ConvNet3()
optimizer = optim.SGD(model8.parameters(), lr=learning_rate)
In [561]:
# Train model8 with mean-squared-error loss on the entries stored under the
# "X_train_class" / "y_train_class" keys of `data`.
# NOTE(review): epochs=100000 is effectively open-ended — presumably the run is
# meant to be stopped by hand once the loss plateaus; confirm, or pick a bounded value.
train(model8, optimizer, epochs=100000, x_train=data["X_train_class"],  y_train=data["y_train_class"], criterion=nn.MSELoss())
--- Epoch 1 / 100000
Iteration 0, loss = 0.1976
Iteration 20, loss = 0.0927
Iteration 40, loss = 0.1733
Iteration 60, loss = 0.0530
Iteration 80, loss = 0.0337
--- Epoch 2 / 100000
Iteration 0, loss = 0.0477
Iteration 20, loss = 0.0444
Iteration 40, loss = 0.0882
Iteration 60, loss = 0.0287
Iteration 80, loss = 0.0167
--- Epoch 3 / 100000
Iteration 0, loss = 0.0318
Iteration 20, loss = 0.0313
Iteration 40, loss = 0.0402
Iteration 60, loss = 0.0319
Iteration 80, loss = 0.0271
--- Epoch 4 / 100000
Iteration 0, loss = 0.1399
Iteration 20, loss = 0.0340
Iteration 40, loss = 0.0406
Iteration 60, loss = 0.0521
Iteration 80, loss = 0.0920
--- Epoch 5 / 100000
Iteration 0, loss = 0.0605
Iteration 20, loss = 0.0213
Iteration 40, loss = 0.0415
Iteration 60, loss = 0.0706
Iteration 80, loss = 0.0520
--- Epoch 6 / 100000
Iteration 0, loss = 0.0535
Iteration 20, loss = 0.0244
Iteration 40, loss = 0.0672
Iteration 60, loss = 0.0459
Iteration 80, loss = 0.0288
--- Epoch 7 / 100000
Iteration 0, loss = 0.0341
Iteration 20, loss = 0.0614
Iteration 40, loss = 0.0282
Iteration 60, loss = 0.0438
Iteration 80, loss = 0.0370
--- Epoch 8 / 100000
Iteration 0, loss = 0.0380
Iteration 20, loss = 0.0354
Iteration 40, loss = 0.0258
Iteration 60, loss = 0.0358
Iteration 80, loss = 0.0340
--- Epoch 9 / 100000
Iteration 0, loss = 0.0496
Iteration 20, loss = 0.0540
Iteration 40, loss = 0.0313
Iteration 60, loss = 0.0265
Iteration 80, loss = 0.0287
--- Epoch 10 / 100000
Iteration 0, loss = 0.0360
Iteration 20, loss = 0.0247
Iteration 40, loss = 0.0380
Iteration 60, loss = 0.0584
Iteration 80, loss = 0.0485
--- Epoch 11 / 100000
Iteration 0, loss = 0.0334
Iteration 20, loss = 0.0365
Iteration 40, loss = 0.0245
Iteration 60, loss = 0.0408
Iteration 80, loss = 0.0423
--- Epoch 12 / 100000
Iteration 0, loss = 0.0347
Iteration 20, loss = 0.0254
Iteration 40, loss = 0.0262
Iteration 60, loss = 0.0203
Iteration 80, loss = 0.0754
--- Epoch 13 / 100000
Iteration 0, loss = 0.0351
Iteration 20, loss = 0.0237
Iteration 40, loss = 0.0437
Iteration 60, loss = 0.0341
Iteration 80, loss = 0.0482
--- Epoch 14 / 100000
Iteration 0, loss = 0.0326
Iteration 20, loss = 0.1028
Iteration 40, loss = 0.0316
Iteration 60, loss = 0.0360
Iteration 80, loss = 0.0439
--- Epoch 15 / 100000
Iteration 0, loss = 0.0764
Iteration 20, loss = 0.0274
Iteration 40, loss = 0.0196
Iteration 60, loss = 0.0262
Iteration 80, loss = 0.0331
--- Epoch 16 / 100000
Iteration 0, loss = 0.0450
Iteration 20, loss = 0.0352
Iteration 40, loss = 0.0206
Iteration 60, loss = 0.0103
Iteration 80, loss = 0.0636
--- Epoch 17 / 100000
Iteration 0, loss = 0.0328
Iteration 20, loss = 0.0384
Iteration 40, loss = 0.0201
Iteration 60, loss = 0.0609
Iteration 80, loss = 0.0288
--- Epoch 18 / 100000
Iteration 0, loss = 0.0740
Iteration 20, loss = 0.0288
Iteration 40, loss = 0.0257
Iteration 60, loss = 0.0446
Iteration 80, loss = 0.0555
--- Epoch 19 / 100000
Iteration 0, loss = 0.0608
Iteration 20, loss = 0.0210
Iteration 40, loss = 0.0368
Iteration 60, loss = 0.0220
Iteration 80, loss = 0.0565
--- Epoch 20 / 100000
Iteration 0, loss = 0.0355
Iteration 20, loss = 0.0769
Iteration 40, loss = 0.0236
Iteration 60, loss = 0.0232
Iteration 80, loss = 0.0690
--- Epoch 21 / 100000
Iteration 0, loss = 0.0260
Iteration 20, loss = 0.0500
Iteration 40, loss = 0.0284
Iteration 60, loss = 0.0251
Iteration 80, loss = 0.0297
--- Epoch 22 / 100000
Iteration 0, loss = 0.0381
Iteration 20, loss = 0.0148
Iteration 40, loss = 0.0207
Iteration 60, loss = 0.0218
Iteration 80, loss = 0.0194
--- Epoch 23 / 100000
Iteration 0, loss = 0.0172
Iteration 20, loss = 0.0309
Iteration 40, loss = 0.0149
Iteration 60, loss = 0.0252
Iteration 80, loss = 0.0331
--- Epoch 24 / 100000
Iteration 0, loss = 0.0360
Iteration 20, loss = 0.0739
Iteration 40, loss = 0.0271
Iteration 60, loss = 0.0274
Iteration 80, loss = 0.0224
--- Epoch 25 / 100000
Iteration 0, loss = 0.0675
Iteration 20, loss = 0.0219
Iteration 40, loss = 0.0374
Iteration 60, loss = 0.0255
Iteration 80, loss = 0.0583
--- Epoch 26 / 100000
Iteration 0, loss = 0.0353
Iteration 20, loss = 0.0301
Iteration 40, loss = 0.0452
Iteration 60, loss = 0.0239
Iteration 80, loss = 0.0224
--- Epoch 27 / 100000
Iteration 0, loss = 0.0582
Iteration 20, loss = 0.0410
Iteration 40, loss = 0.0372
Iteration 60, loss = 0.0138
Iteration 80, loss = 0.0599
--- Epoch 28 / 100000
Iteration 0, loss = 0.0430
Iteration 20, loss = 0.0259
Iteration 40, loss = 0.0174
Iteration 60, loss = 0.0475
Iteration 80, loss = 0.0303
--- Epoch 29 / 100000
Iteration 0, loss = 0.0277
Iteration 20, loss = 0.0121
Iteration 40, loss = 0.0263
Iteration 60, loss = 0.0296
Iteration 80, loss = 0.0255
--- Epoch 30 / 100000
Iteration 0, loss = 0.0309
Iteration 20, loss = 0.0323
Iteration 40, loss = 0.0285
Iteration 60, loss = 0.0521
Iteration 80, loss = 0.0162
--- Epoch 31 / 100000
Iteration 0, loss = 0.0313
Iteration 20, loss = 0.0175
Iteration 40, loss = 0.0211
Iteration 60, loss = 0.0433
Iteration 80, loss = 0.0287
--- Epoch 32 / 100000
Iteration 0, loss = 0.0298
Iteration 20, loss = 0.0414
Iteration 40, loss = 0.0127
Iteration 60, loss = 0.0536
Iteration 80, loss = 0.0246
--- Epoch 33 / 100000
Iteration 0, loss = 0.0730
Iteration 20, loss = 0.0395
Iteration 40, loss = 0.0476
Iteration 60, loss = 0.0152
Iteration 80, loss = 0.0332
--- Epoch 34 / 100000
Iteration 0, loss = 0.0482
Iteration 20, loss = 0.0509
Iteration 40, loss = 0.0369
Iteration 60, loss = 0.0318
Iteration 80, loss = 0.0278
--- Epoch 35 / 100000
Iteration 0, loss = 0.0236
Iteration 20, loss = 0.0674
Iteration 40, loss = 0.0588
Iteration 60, loss = 0.0473
Iteration 80, loss = 0.0314
--- Epoch 36 / 100000
Iteration 0, loss = 0.0172
Iteration 20, loss = 0.0121
Iteration 40, loss = 0.0778
Iteration 60, loss = 0.0372
Iteration 80, loss = 0.0194
--- Epoch 37 / 100000
Iteration 0, loss = 0.0307
Iteration 20, loss = 0.0323
Iteration 40, loss = 0.0429
Iteration 60, loss = 0.0272
Iteration 80, loss = 0.0203
--- Epoch 38 / 100000
Iteration 0, loss = 0.0503
Iteration 20, loss = 0.0177
Iteration 40, loss = 0.0308
Iteration 60, loss = 0.0372
Iteration 80, loss = 0.0377
--- Epoch 39 / 100000
Iteration 0, loss = 0.0306
Iteration 20, loss = 0.0362
Iteration 40, loss = 0.0341
Iteration 60, loss = 0.0250
Iteration 80, loss = 0.0344
--- Epoch 40 / 100000
Iteration 0, loss = 0.0152
Iteration 20, loss = 0.0255
Iteration 40, loss = 0.0200
Iteration 60, loss = 0.0238
Iteration 80, loss = 0.0166
--- Epoch 41 / 100000
Iteration 0, loss = 0.0561
Iteration 20, loss = 0.0557
Iteration 40, loss = 0.0315
Iteration 60, loss = 0.0167
Iteration 80, loss = 0.0309
--- Epoch 42 / 100000
Iteration 0, loss = 0.0339
Iteration 20, loss = 0.0273
Iteration 40, loss = 0.0242
Iteration 60, loss = 0.0335
Iteration 80, loss = 0.0088
--- Epoch 43 / 100000
Iteration 0, loss = 0.0207
Iteration 20, loss = 0.0332
Iteration 40, loss = 0.0199
Iteration 60, loss = 0.0365
Iteration 80, loss = 0.0149
--- Epoch 44 / 100000
Iteration 0, loss = 0.0241
Iteration 20, loss = 0.0277
Iteration 40, loss = 0.0322
Iteration 60, loss = 0.0141
Iteration 80, loss = 0.0184
--- Epoch 45 / 100000
Iteration 0, loss = 0.0376
Iteration 20, loss = 0.0237
Iteration 40, loss = 0.0341
Iteration 60, loss = 0.0267
Iteration 80, loss = 0.0710
--- Epoch 46 / 100000
Iteration 0, loss = 0.0311
Iteration 20, loss = 0.0150
Iteration 40, loss = 0.0210
Iteration 60, loss = 0.0282
Iteration 80, loss = 0.0380
--- Epoch 47 / 100000
Iteration 0, loss = 0.0225
Iteration 20, loss = 0.0276
Iteration 40, loss = 0.0203
Iteration 60, loss = 0.0241
Iteration 80, loss = 0.0517
--- Epoch 48 / 100000
Iteration 0, loss = 0.0220
Iteration 20, loss = 0.0689
Iteration 40, loss = 0.0451
Iteration 60, loss = 0.0430
Iteration 80, loss = 0.0217
--- Epoch 49 / 100000
Iteration 0, loss = 0.0159
Iteration 20, loss = 0.0243
Iteration 40, loss = 0.0316
Iteration 60, loss = 0.0185
Iteration 80, loss = 0.0327
--- Epoch 50 / 100000
Iteration 0, loss = 0.0283
Iteration 20, loss = 0.0206
Iteration 40, loss = 0.0288
Iteration 60, loss = 0.0274
Iteration 80, loss = 0.0187
--- Epoch 51 / 100000
Iteration 0, loss = 0.0285
Iteration 20, loss = 0.0183
Iteration 40, loss = 0.0244
Iteration 60, loss = 0.0278
Iteration 80, loss = 0.0256
--- Epoch 52 / 100000
Iteration 0, loss = 0.0192
Iteration 20, loss = 0.0375
Iteration 40, loss = 0.0173
Iteration 60, loss = 0.0467
Iteration 80, loss = 0.0378
--- Epoch 53 / 100000
Iteration 0, loss = 0.0385
Iteration 20, loss = 0.0208
Iteration 40, loss = 0.0355
Iteration 60, loss = 0.0177
Iteration 80, loss = 0.0161
--- Epoch 54 / 100000
Iteration 0, loss = 0.0229
Iteration 20, loss = 0.0135
Iteration 40, loss = 0.0315
Iteration 60, loss = 0.0478
Iteration 80, loss = 0.0824
--- Epoch 55 / 100000
Iteration 0, loss = 0.0202
Iteration 20, loss = 0.0190
Iteration 40, loss = 0.0150
Iteration 60, loss = 0.0137
Iteration 80, loss = 0.0324
--- Epoch 56 / 100000
Iteration 0, loss = 0.0191
Iteration 20, loss = 0.0187
Iteration 40, loss = 0.0197
Iteration 60, loss = 0.0164
Iteration 80, loss = 0.0195
--- Epoch 57 / 100000
Iteration 0, loss = 0.0454
Iteration 20, loss = 0.0171
Iteration 40, loss = 0.0229
Iteration 60, loss = 0.0178
Iteration 80, loss = 0.0260
--- Epoch 58 / 100000
Iteration 0, loss = 0.0570
Iteration 20, loss = 0.0897
Iteration 40, loss = 0.0759
Iteration 60, loss = 0.0204
Iteration 80, loss = 0.0340
--- Epoch 59 / 100000
Iteration 0, loss = 0.0257
Iteration 20, loss = 0.0310
Iteration 40, loss = 0.0392
Iteration 60, loss = 0.0135
Iteration 80, loss = 0.0248
--- Epoch 60 / 100000
Iteration 0, loss = 0.0134
Iteration 20, loss = 0.0319
Iteration 40, loss = 0.0213
Iteration 60, loss = 0.0330
Iteration 80, loss = 0.0215
--- Epoch 61 / 100000
Iteration 0, loss = 0.0225
Iteration 20, loss = 0.0167
Iteration 40, loss = 0.0233
Iteration 60, loss = 0.0239
Iteration 80, loss = 0.0319
--- Epoch 62 / 100000
Iteration 0, loss = 0.0270
Iteration 20, loss = 0.0294
Iteration 40, loss = 0.0491
Iteration 60, loss = 0.0623
Iteration 80, loss = 0.0242
--- Epoch 63 / 100000
Iteration 0, loss = 0.0260
Iteration 20, loss = 0.0303
Iteration 40, loss = 0.0371
Iteration 60, loss = 0.0227
Iteration 80, loss = 0.0215
--- Epoch 64 / 100000
Iteration 0, loss = 0.0143
Iteration 20, loss = 0.0332
Iteration 40, loss = 0.0287
Iteration 60, loss = 0.0266
Iteration 80, loss = 0.0345
--- Epoch 65 / 100000
Iteration 0, loss = 0.0283
Iteration 20, loss = 0.0217
Iteration 40, loss = 0.0406
Iteration 60, loss = 0.0139
Iteration 80, loss = 0.0389
--- Epoch 66 / 100000
Iteration 0, loss = 0.0226
Iteration 20, loss = 0.0322
Iteration 40, loss = 0.0352
Iteration 60, loss = 0.0248
Iteration 80, loss = 0.0280
--- Epoch 67 / 100000
Iteration 0, loss = 0.0285
Iteration 20, loss = 0.0263
Iteration 40, loss = 0.0181
Iteration 60, loss = 0.0156
Iteration 80, loss = 0.0253
--- Epoch 68 / 100000
Iteration 0, loss = 0.0392
Iteration 20, loss = 0.0395
Iteration 40, loss = 0.0183
Iteration 60, loss = 0.0287
Iteration 80, loss = 0.0183
--- Epoch 69 / 100000
Iteration 0, loss = 0.0332
Iteration 20, loss = 0.0385
Iteration 40, loss = 0.0111
Iteration 60, loss = 0.0229
Iteration 80, loss = 0.0363
--- Epoch 70 / 100000
Iteration 0, loss = 0.0212
Iteration 20, loss = 0.0185
Iteration 40, loss = 0.0277
Iteration 60, loss = 0.0171
Iteration 80, loss = 0.0144
--- Epoch 71 / 100000
Iteration 0, loss = 0.0285
Iteration 20, loss = 0.0099
Iteration 40, loss = 0.0290
Iteration 60, loss = 0.0198
Iteration 80, loss = 0.0247
--- Epoch 72 / 100000
Iteration 0, loss = 0.0381
Iteration 20, loss = 0.0227
Iteration 40, loss = 0.0326
Iteration 60, loss = 0.0121
Iteration 80, loss = 0.0179
--- Epoch 73 / 100000
Iteration 0, loss = 0.0402
Iteration 20, loss = 0.0261
Iteration 40, loss = 0.0379
Iteration 60, loss = 0.0181
Iteration 80, loss = 0.0308
--- Epoch 74 / 100000
Iteration 0, loss = 0.0251
Iteration 20, loss = 0.0297
Iteration 40, loss = 0.0208
Iteration 60, loss = 0.0305
Iteration 80, loss = 0.0356
--- Epoch 75 / 100000
Iteration 0, loss = 0.0310
Iteration 20, loss = 0.0190
Iteration 40, loss = 0.0249
Iteration 60, loss = 0.0100
Iteration 80, loss = 0.0238
--- Epoch 76 / 100000
Iteration 0, loss = 0.0275
Iteration 20, loss = 0.0329
Iteration 40, loss = 0.0217
Iteration 60, loss = 0.0305
Iteration 80, loss = 0.0284
--- Epoch 77 / 100000
Iteration 0, loss = 0.0220
Iteration 20, loss = 0.0245
Iteration 40, loss = 0.0403
Iteration 60, loss = 0.0206
Iteration 80, loss = 0.0242
--- Epoch 78 / 100000
Iteration 0, loss = 0.0239
Iteration 20, loss = 0.0199
Iteration 40, loss = 0.0417
Iteration 60, loss = 0.0130
Iteration 80, loss = 0.0430
--- Epoch 79 / 100000
Iteration 0, loss = 0.0256
Iteration 20, loss = 0.0243
Iteration 40, loss = 0.0357
Iteration 60, loss = 0.0135
Iteration 80, loss = 0.0177
--- Epoch 80 / 100000
Iteration 0, loss = 0.0210
Iteration 20, loss = 0.0531
Iteration 40, loss = 0.0184
Iteration 60, loss = 0.0169
Iteration 80, loss = 0.0487
--- Epoch 81 / 100000
Iteration 0, loss = 0.0206
Iteration 20, loss = 0.0164
Iteration 40, loss = 0.0191
Iteration 60, loss = 0.0179
Iteration 80, loss = 0.0157
--- Epoch 82 / 100000
Iteration 0, loss = 0.0194
Iteration 20, loss = 0.0216
Iteration 40, loss = 0.0312
Iteration 60, loss = 0.0270
Iteration 80, loss = 0.0436
--- Epoch 83 / 100000
Iteration 0, loss = 0.0171
Iteration 20, loss = 0.0294
Iteration 40, loss = 0.0332
Iteration 60, loss = 0.0247
Iteration 80, loss = 0.0224
--- Epoch 84 / 100000
Iteration 0, loss = 0.0260
Iteration 20, loss = 0.0207
Iteration 40, loss = 0.0165
Iteration 60, loss = 0.0264
Iteration 80, loss = 0.0151
--- Epoch 85 / 100000
Iteration 0, loss = 0.0211
Iteration 20, loss = 0.0254
Iteration 40, loss = 0.0105
Iteration 60, loss = 0.0221
Iteration 80, loss = 0.0168
--- Epoch 86 / 100000
Iteration 0, loss = 0.0250
Iteration 20, loss = 0.0250
Iteration 40, loss = 0.0197
Iteration 60, loss = 0.0122
Iteration 80, loss = 0.0146
--- Epoch 87 / 100000
Iteration 0, loss = 0.0265
Iteration 20, loss = 0.0162
Iteration 40, loss = 0.0204
Iteration 60, loss = 0.0237
Iteration 80, loss = 0.0191
--- Epoch 88 / 100000
Iteration 0, loss = 0.0210
Iteration 20, loss = 0.0311
Iteration 40, loss = 0.0146
Iteration 60, loss = 0.0142
Iteration 80, loss = 0.0300
--- Epoch 89 / 100000
Iteration 0, loss = 0.0158
Iteration 20, loss = 0.0232
Iteration 40, loss = 0.0157
Iteration 60, loss = 0.0246
Iteration 80, loss = 0.0397
--- Epoch 90 / 100000
Iteration 0, loss = 0.0099
Iteration 20, loss = 0.0137
Iteration 40, loss = 0.0238
Iteration 60, loss = 0.0288
Iteration 80, loss = 0.0212
--- Epoch 91 / 100000
Iteration 0, loss = 0.0264
Iteration 20, loss = 0.0143
Iteration 40, loss = 0.0165
Iteration 60, loss = 0.0286
Iteration 80, loss = 0.0231
--- Epoch 92 / 100000
Iteration 0, loss = 0.0102
Iteration 20, loss = 0.0360
Iteration 40, loss = 0.0284
Iteration 60, loss = 0.0213
Iteration 80, loss = 0.0144
--- Epoch 93 / 100000
Iteration 0, loss = 0.0203
Iteration 20, loss = 0.0097
Iteration 40, loss = 0.0324
Iteration 60, loss = 0.0249
Iteration 80, loss = 0.0140
--- Epoch 94 / 100000
Iteration 0, loss = 0.0274
Iteration 20, loss = 0.0140
Iteration 40, loss = 0.0208
Iteration 60, loss = 0.0304
Iteration 80, loss = 0.0288
--- Epoch 95 / 100000
Iteration 0, loss = 0.0307
Iteration 20, loss = 0.0267
Iteration 40, loss = 0.0235
Iteration 60, loss = 0.0296
Iteration 80, loss = 0.0162
--- Epoch 96 / 100000
Iteration 0, loss = 0.0239
Iteration 20, loss = 0.0380
Iteration 40, loss = 0.0309
Iteration 60, loss = 0.0385
Iteration 80, loss = 0.0264
--- Epoch 97 / 100000
Iteration 0, loss = 0.0205
Iteration 20, loss = 0.0240
Iteration 40, loss = 0.0172
Iteration 60, loss = 0.0205
Iteration 80, loss = 0.0205
--- Epoch 98 / 100000
Iteration 0, loss = 0.0321
Iteration 20, loss = 0.0177
Iteration 40, loss = 0.0446
Iteration 60, loss = 0.0272
Iteration 80, loss = 0.0128
--- Epoch 99 / 100000
Iteration 0, loss = 0.0177
Iteration 20, loss = 0.0213
Iteration 40, loss = 0.0370
Iteration 60, loss = 0.0160
Iteration 80, loss = 0.0273
--- Epoch 100 / 100000
Iteration 0, loss = 0.0165
Iteration 20, loss = 0.0218
Iteration 40, loss = 0.0358
Iteration 60, loss = 0.0330
Iteration 80, loss = 0.0278
--- Epoch 101 / 100000
Iteration 0, loss = 0.0082
Iteration 20, loss = 0.0287
Iteration 40, loss = 0.0354
Iteration 60, loss = 0.0304
Iteration 80, loss = 0.0155
--- Epoch 102 / 100000
Iteration 0, loss = 0.0369
Iteration 20, loss = 0.0282
Iteration 40, loss = 0.0177
Iteration 60, loss = 0.0197
Iteration 80, loss = 0.0251
--- Epoch 103 / 100000
Iteration 0, loss = 0.0282
Iteration 20, loss = 0.0186
Iteration 40, loss = 0.0125
Iteration 60, loss = 0.0235
Iteration 80, loss = 0.0505
--- Epoch 104 / 100000
Iteration 0, loss = 0.0222
Iteration 20, loss = 0.0290
Iteration 40, loss = 0.0215
Iteration 60, loss = 0.0255
Iteration 80, loss = 0.0255
--- Epoch 105 / 100000
Iteration 0, loss = 0.0590
Iteration 20, loss = 0.0231
Iteration 40, loss = 0.0360
Iteration 60, loss = 0.0256
Iteration 80, loss = 0.0158
--- Epoch 106 / 100000
Iteration 0, loss = 0.0207
Iteration 20, loss = 0.0402
Iteration 40, loss = 0.0454
Iteration 60, loss = 0.0185
Iteration 80, loss = 0.0253
--- Epoch 107 / 100000
Iteration 0, loss = 0.0115
Iteration 20, loss = 0.0201
Iteration 40, loss = 0.0140
Iteration 60, loss = 0.0155
Iteration 80, loss = 0.0224
--- Epoch 108 / 100000
Iteration 0, loss = 0.0117
Iteration 20, loss = 0.0162
Iteration 40, loss = 0.0330
Iteration 60, loss = 0.0233
Iteration 80, loss = 0.0241
--- Epoch 109 / 100000
Iteration 0, loss = 0.0288
Iteration 20, loss = 0.0341
Iteration 40, loss = 0.0246
Iteration 60, loss = 0.0242
Iteration 80, loss = 0.0233
--- Epoch 110 / 100000
Iteration 0, loss = 0.0174
Iteration 20, loss = 0.0180
Iteration 40, loss = 0.0192
Iteration 60, loss = 0.0214
Iteration 80, loss = 0.0143
--- Epoch 111 / 100000
Iteration 0, loss = 0.0279
Iteration 20, loss = 0.0162
Iteration 40, loss = 0.0472
Iteration 60, loss = 0.0628
Iteration 80, loss = 0.0128
--- Epoch 112 / 100000
Iteration 0, loss = 0.0282
Iteration 20, loss = 0.0173
Iteration 40, loss = 0.0227
Iteration 60, loss = 0.0255
Iteration 80, loss = 0.0439
--- Epoch 113 / 100000
Iteration 0, loss = 0.0318
Iteration 20, loss = 0.0152
Iteration 40, loss = 0.0161
Iteration 60, loss = 0.0138
Iteration 80, loss = 0.0138
--- Epoch 114 / 100000
Iteration 0, loss = 0.0211
Iteration 20, loss = 0.0158
Iteration 40, loss = 0.0138
Iteration 60, loss = 0.0213
Iteration 80, loss = 0.0068
--- Epoch 115 / 100000
Iteration 0, loss = 0.0392
Iteration 20, loss = 0.0210
Iteration 40, loss = 0.0086
Iteration 60, loss = 0.0168
Iteration 80, loss = 0.0318
--- Epoch 116 / 100000
Iteration 0, loss = 0.0215
Iteration 20, loss = 0.0212
Iteration 40, loss = 0.0115
Iteration 60, loss = 0.0455
Iteration 80, loss = 0.0164
--- Epoch 117 / 100000
Iteration 0, loss = 0.0174
Iteration 20, loss = 0.0326
Iteration 40, loss = 0.0198
Iteration 60, loss = 0.0260
Iteration 80, loss = 0.0137
--- Epoch 118 / 100000
Iteration 0, loss = 0.0276
Iteration 20, loss = 0.0231
Iteration 40, loss = 0.0203
Iteration 60, loss = 0.0317
Iteration 80, loss = 0.0301
--- Epoch 119 / 100000
Iteration 0, loss = 0.0246
Iteration 20, loss = 0.0231
Iteration 40, loss = 0.0160
Iteration 60, loss = 0.0425
Iteration 80, loss = 0.0187
--- Epoch 120 / 100000
Iteration 0, loss = 0.0140
Iteration 20, loss = 0.0129
Iteration 40, loss = 0.0091
Iteration 60, loss = 0.0159
Iteration 80, loss = 0.0167
--- Epoch 121 / 100000
Iteration 0, loss = 0.0264
Iteration 20, loss = 0.0197
Iteration 40, loss = 0.0166
Iteration 60, loss = 0.0207
Iteration 80, loss = 0.0552
--- Epoch 122 / 100000
Iteration 0, loss = 0.0159
Iteration 20, loss = 0.0175
Iteration 40, loss = 0.0188
Iteration 60, loss = 0.0216
Iteration 80, loss = 0.0103
--- Epoch 123 / 100000
Iteration 0, loss = 0.0231
Iteration 20, loss = 0.0302
Iteration 40, loss = 0.0198
Iteration 60, loss = 0.0242
Iteration 80, loss = 0.0205
--- Epoch 124 / 100000
Iteration 0, loss = 0.0166
Iteration 20, loss = 0.0150
Iteration 40, loss = 0.0199
Iteration 60, loss = 0.0189
Iteration 80, loss = 0.0284
--- Epoch 125 / 100000
Iteration 0, loss = 0.0206
Iteration 20, loss = 0.0254
Iteration 40, loss = 0.0204
Iteration 60, loss = 0.0160
Iteration 80, loss = 0.0107
--- Epoch 126 / 100000
Iteration 0, loss = 0.0166
Iteration 20, loss = 0.0134
Iteration 40, loss = 0.0282
Iteration 60, loss = 0.0173
Iteration 80, loss = 0.0119
--- Epoch 127 / 100000
Iteration 0, loss = 0.0288
Iteration 20, loss = 0.0089
Iteration 40, loss = 0.0195
Iteration 60, loss = 0.0164
Iteration 80, loss = 0.0141
--- Epoch 128 / 100000
Iteration 0, loss = 0.0158
Iteration 20, loss = 0.0309
Iteration 40, loss = 0.0308
Iteration 60, loss = 0.0194
Iteration 80, loss = 0.0294
--- Epoch 129 / 100000
Iteration 0, loss = 0.0203
Iteration 20, loss = 0.0303
Iteration 40, loss = 0.0430
Iteration 60, loss = 0.0255
Iteration 80, loss = 0.0589
--- Epoch 130 / 100000
Iteration 0, loss = 0.0207
Iteration 20, loss = 0.0589
Iteration 40, loss = 0.0171
Iteration 60, loss = 0.0170
Iteration 80, loss = 0.0205
--- Epoch 131 / 100000
Iteration 0, loss = 0.0239
Iteration 20, loss = 0.0223
Iteration 40, loss = 0.0166
Iteration 60, loss = 0.0146
Iteration 80, loss = 0.0380
--- Epoch 132 / 100000
Iteration 0, loss = 0.0330
Iteration 20, loss = 0.0370
Iteration 40, loss = 0.0430
Iteration 60, loss = 0.0117
Iteration 80, loss = 0.0126
--- Epoch 133 / 100000
Iteration 0, loss = 0.0315
Iteration 20, loss = 0.0293
Iteration 40, loss = 0.0286
Iteration 60, loss = 0.0230
Iteration 80, loss = 0.0348
--- Epoch 134 / 100000
Iteration 0, loss = 0.0121
Iteration 20, loss = 0.0235
Iteration 40, loss = 0.0150
Iteration 60, loss = 0.0290
Iteration 80, loss = 0.0159
--- Epoch 135 / 100000
Iteration 0, loss = 0.0115
Iteration 20, loss = 0.0089
Iteration 40, loss = 0.0209
Iteration 60, loss = 0.0378
Iteration 80, loss = 0.0283
--- Epoch 136 / 100000
Iteration 0, loss = 0.0142
Iteration 20, loss = 0.0377
Iteration 40, loss = 0.0143
Iteration 60, loss = 0.0112
Iteration 80, loss = 0.0152
--- Epoch 137 / 100000
Iteration 0, loss = 0.0711
Iteration 20, loss = 0.0292
Iteration 40, loss = 0.0134
Iteration 60, loss = 0.0358
Iteration 80, loss = 0.0465
--- Epoch 138 / 100000
Iteration 0, loss = 0.0535
Iteration 20, loss = 0.0427
Iteration 40, loss = 0.0149
Iteration 60, loss = 0.0164
Iteration 80, loss = 0.0179
--- Epoch 139 / 100000
Iteration 0, loss = 0.0176
Iteration 20, loss = 0.0189
Iteration 40, loss = 0.0305
Iteration 60, loss = 0.0286
Iteration 80, loss = 0.0193
--- Epoch 140 / 100000
Iteration 0, loss = 0.0190
Iteration 20, loss = 0.0185
Iteration 40, loss = 0.0369
Iteration 60, loss = 0.0240
Iteration 80, loss = 0.0216
--- Epoch 141 / 100000
Iteration 0, loss = 0.0176
Iteration 20, loss = 0.0361
Iteration 40, loss = 0.0156
Iteration 60, loss = 0.0339
Iteration 80, loss = 0.0157
--- Epoch 142 / 100000
Iteration 0, loss = 0.0195
Iteration 20, loss = 0.0318
Iteration 40, loss = 0.0205
Iteration 60, loss = 0.0256
Iteration 80, loss = 0.0201
--- Epoch 143 / 100000
Iteration 0, loss = 0.0169
Iteration 20, loss = 0.0409
Iteration 40, loss = 0.0244
Iteration 60, loss = 0.0379
Iteration 80, loss = 0.0258
--- Epoch 144 / 100000
Iteration 0, loss = 0.0242
Iteration 20, loss = 0.0339
Iteration 40, loss = 0.0170
Iteration 60, loss = 0.0360
Iteration 80, loss = 0.0182
--- Epoch 145 / 100000
Iteration 0, loss = 0.0327
Iteration 20, loss = 0.0442
Iteration 40, loss = 0.0251
Iteration 60, loss = 0.0159
Iteration 80, loss = 0.0146
--- Epoch 146 / 100000
Iteration 0, loss = 0.0197
Iteration 20, loss = 0.0137
Iteration 40, loss = 0.0209
Iteration 60, loss = 0.0410
Iteration 80, loss = 0.0283
--- Epoch 147 / 100000
Iteration 0, loss = 0.0099
Iteration 20, loss = 0.0259
Iteration 40, loss = 0.0146
Iteration 60, loss = 0.0327
Iteration 80, loss = 0.0260
--- Epoch 148 / 100000
Iteration 0, loss = 0.0213
Iteration 20, loss = 0.0193
Iteration 40, loss = 0.0207
Iteration 60, loss = 0.0167
Iteration 80, loss = 0.0350
--- Epoch 149 / 100000
Iteration 0, loss = 0.0252
Iteration 20, loss = 0.0203
Iteration 40, loss = 0.0224
Iteration 60, loss = 0.0335
Iteration 80, loss = 0.0256
--- Epoch 150 / 100000
Iteration 0, loss = 0.0084
Iteration 20, loss = 0.0132
Iteration 40, loss = 0.0130
Iteration 60, loss = 0.0258
Iteration 80, loss = 0.0143
--- Epoch 151 / 100000
Iteration 0, loss = 0.0313
Iteration 20, loss = 0.0139
Iteration 40, loss = 0.0135
Iteration 60, loss = 0.0183
Iteration 80, loss = 0.0503
--- Epoch 152 / 100000
Iteration 0, loss = 0.0142
Iteration 20, loss = 0.0128
Iteration 40, loss = 0.0259
Iteration 60, loss = 0.0301
Iteration 80, loss = 0.0156
--- Epoch 153 / 100000
Iteration 0, loss = 0.0137
Iteration 20, loss = 0.0378
Iteration 40, loss = 0.0231
Iteration 60, loss = 0.0167
Iteration 80, loss = 0.0164
--- Epoch 154 / 100000
Iteration 0, loss = 0.0162
Iteration 20, loss = 0.0229
Iteration 40, loss = 0.0284
Iteration 60, loss = 0.0121
Iteration 80, loss = 0.0207
--- Epoch 155 / 100000
Iteration 0, loss = 0.0122
Iteration 20, loss = 0.0159
Iteration 40, loss = 0.0188
Iteration 60, loss = 0.0190
Iteration 80, loss = 0.0225
--- Epoch 156 / 100000
Iteration 0, loss = 0.0281
Iteration 20, loss = 0.0389
Iteration 40, loss = 0.0348
Iteration 60, loss = 0.0414
Iteration 80, loss = 0.0276
--- Epoch 157 / 100000
Iteration 0, loss = 0.0107
Iteration 20, loss = 0.0173
Iteration 40, loss = 0.0189
Iteration 60, loss = 0.0467
Iteration 80, loss = 0.0183
--- Epoch 158 / 100000
Iteration 0, loss = 0.0158
Iteration 20, loss = 0.0233
Iteration 40, loss = 0.0283
Iteration 60, loss = 0.0241
Iteration 80, loss = 0.0135
--- Epoch 159 / 100000
Iteration 0, loss = 0.0125
Iteration 20, loss = 0.0260
Iteration 40, loss = 0.0169
Iteration 60, loss = 0.0170
Iteration 80, loss = 0.0151
--- Epoch 160 / 100000
Iteration 0, loss = 0.0237
Iteration 20, loss = 0.0275
Iteration 40, loss = 0.0302
Iteration 60, loss = 0.0349
Iteration 80, loss = 0.0142
--- Epoch 161 / 100000
Iteration 0, loss = 0.0255
Iteration 20, loss = 0.0161
Iteration 40, loss = 0.0219
Iteration 60, loss = 0.0207
Iteration 80, loss = 0.0125
--- Epoch 162 / 100000
Iteration 0, loss = 0.0291
Iteration 20, loss = 0.0208
Iteration 40, loss = 0.0098
Iteration 60, loss = 0.0194
Iteration 80, loss = 0.0212
--- Epoch 163 / 100000
Iteration 0, loss = 0.0214
Iteration 20, loss = 0.0199
Iteration 40, loss = 0.0181
Iteration 60, loss = 0.0470
Iteration 80, loss = 0.0134
--- Epoch 164 / 100000
Iteration 0, loss = 0.0171
Iteration 20, loss = 0.0327
Iteration 40, loss = 0.0256
Iteration 60, loss = 0.0259
Iteration 80, loss = 0.0168
--- Epoch 165 / 100000
Iteration 0, loss = 0.0244
Iteration 20, loss = 0.0168
Iteration 40, loss = 0.0146
Iteration 60, loss = 0.0267
Iteration 80, loss = 0.0186
--- Epoch 166 / 100000
Iteration 0, loss = 0.0134
Iteration 20, loss = 0.0208
Iteration 40, loss = 0.0205
Iteration 60, loss = 0.0134
Iteration 80, loss = 0.0265
--- Epoch 167 / 100000
Iteration 0, loss = 0.0160
Iteration 20, loss = 0.0290
Iteration 40, loss = 0.0123
Iteration 60, loss = 0.0306
Iteration 80, loss = 0.0160
--- Epoch 168 / 100000
Iteration 0, loss = 0.0293
Iteration 20, loss = 0.0182
Iteration 40, loss = 0.0165
Iteration 60, loss = 0.0238
Iteration 80, loss = 0.0223
--- Epoch 169 / 100000
Iteration 0, loss = 0.0094
Iteration 20, loss = 0.0208
Iteration 40, loss = 0.0142
Iteration 60, loss = 0.0431
Iteration 80, loss = 0.0467
--- Epoch 170 / 100000
Iteration 0, loss = 0.0173
Iteration 20, loss = 0.0154
Iteration 40, loss = 0.0287
Iteration 60, loss = 0.0132
Iteration 80, loss = 0.0161
--- Epoch 171 / 100000
Iteration 0, loss = 0.0210
Iteration 20, loss = 0.0092
Iteration 40, loss = 0.0117
Iteration 60, loss = 0.0269
Iteration 80, loss = 0.0226
--- Epoch 172 / 100000
Iteration 0, loss = 0.0261
Iteration 20, loss = 0.0184
Iteration 40, loss = 0.0312
Iteration 60, loss = 0.0482
Iteration 80, loss = 0.0632
--- Epoch 173 / 100000
Iteration 0, loss = 0.0403
Iteration 20, loss = 0.0194
Iteration 40, loss = 0.0252
Iteration 60, loss = 0.0111
Iteration 80, loss = 0.0252
--- Epoch 174 / 100000
Iteration 0, loss = 0.0284
Iteration 20, loss = 0.0179
Iteration 40, loss = 0.0204
Iteration 60, loss = 0.0233
Iteration 80, loss = 0.0335
--- Epoch 175 / 100000
Iteration 0, loss = 0.0179
Iteration 20, loss = 0.0181
Iteration 40, loss = 0.0218
Iteration 60, loss = 0.0346
Iteration 80, loss = 0.0165
--- Epoch 176 / 100000
Iteration 0, loss = 0.0185
Iteration 20, loss = 0.0176
Iteration 40, loss = 0.0179
Iteration 60, loss = 0.0312
Iteration 80, loss = 0.0155
--- Epoch 177 / 100000
Iteration 0, loss = 0.0165
Iteration 20, loss = 0.0171
Iteration 40, loss = 0.0196
Iteration 60, loss = 0.0248
Iteration 80, loss = 0.0158
--- Epoch 178 / 100000
Iteration 0, loss = 0.0204
Iteration 20, loss = 0.0263
Iteration 40, loss = 0.0349
Iteration 60, loss = 0.0228
Iteration 80, loss = 0.0208
--- Epoch 179 / 100000
Iteration 0, loss = 0.0104
Iteration 20, loss = 0.0179
Iteration 40, loss = 0.0236
Iteration 60, loss = 0.0234
Iteration 80, loss = 0.0188
--- Epoch 180 / 100000
Iteration 0, loss = 0.0235
Iteration 20, loss = 0.0297
Iteration 40, loss = 0.0235
Iteration 60, loss = 0.0182
Iteration 80, loss = 0.0218
--- Epoch 181 / 100000
Iteration 0, loss = 0.0217
Iteration 20, loss = 0.0113
Iteration 40, loss = 0.0214
Iteration 60, loss = 0.0140
Iteration 80, loss = 0.0209
--- Epoch 182 / 100000
Iteration 0, loss = 0.0296
Iteration 20, loss = 0.0162
Iteration 40, loss = 0.0268
Iteration 60, loss = 0.0225
Iteration 80, loss = 0.0103
--- Epoch 183 / 100000
Iteration 0, loss = 0.0130
Iteration 20, loss = 0.0140
Iteration 40, loss = 0.0352
Iteration 60, loss = 0.0296
Iteration 80, loss = 0.0224
--- Epoch 184 / 100000
Iteration 0, loss = 0.0204
Iteration 20, loss = 0.0159
Iteration 40, loss = 0.0826
Iteration 60, loss = 0.0175
Iteration 80, loss = 0.0198
--- Epoch 185 / 100000
Iteration 0, loss = 0.0121
Iteration 20, loss = 0.0367
Iteration 40, loss = 0.0235
Iteration 60, loss = 0.0132
Iteration 80, loss = 0.0133
--- Epoch 186 / 100000
Iteration 0, loss = 0.0261
Iteration 20, loss = 0.0144
Iteration 40, loss = 0.0122
Iteration 60, loss = 0.0138
Iteration 80, loss = 0.0110
--- Epoch 187 / 100000
Iteration 0, loss = 0.0175
Iteration 20, loss = 0.0139
Iteration 40, loss = 0.0222
Iteration 60, loss = 0.0387
Iteration 80, loss = 0.0152
--- Epoch 188 / 100000
Iteration 0, loss = 0.0231
Iteration 20, loss = 0.0755
Iteration 40, loss = 0.0253
Iteration 60, loss = 0.0237
Iteration 80, loss = 0.0130
--- Epoch 189 / 100000
Iteration 0, loss = 0.0149
Iteration 20, loss = 0.0467
Iteration 40, loss = 0.0203
Iteration 60, loss = 0.0249
Iteration 80, loss = 0.0188
--- Epoch 190 / 100000
Iteration 0, loss = 0.0205
Iteration 20, loss = 0.0310
Iteration 40, loss = 0.0195
Iteration 60, loss = 0.0522
Iteration 80, loss = 0.0157
--- Epoch 191 / 100000
Iteration 0, loss = 0.0336
Iteration 20, loss = 0.0335
Iteration 40, loss = 0.0220
Iteration 60, loss = 0.0131
Iteration 80, loss = 0.0178
--- Epoch 192 / 100000
Iteration 0, loss = 0.0499
Iteration 20, loss = 0.0124
Iteration 40, loss = 0.0159
Iteration 60, loss = 0.0158
Iteration 80, loss = 0.0305
--- Epoch 193 / 100000
Iteration 0, loss = 0.0386
Iteration 20, loss = 0.0303
Iteration 40, loss = 0.0167
Iteration 60, loss = 0.0277
Iteration 80, loss = 0.0304
--- Epoch 194 / 100000
Iteration 0, loss = 0.0191
Iteration 20, loss = 0.0233
Iteration 40, loss = 0.0128
Iteration 60, loss = 0.0294
Iteration 80, loss = 0.0170
--- Epoch 195 / 100000
Iteration 0, loss = 0.0196
Iteration 20, loss = 0.0257
Iteration 40, loss = 0.0178
Iteration 60, loss = 0.0227
Iteration 80, loss = 0.0276
--- Epoch 196 / 100000
Iteration 0, loss = 0.0166
Iteration 20, loss = 0.0151
Iteration 40, loss = 0.0166
Iteration 60, loss = 0.0383
Iteration 80, loss = 0.0128
--- Epoch 197 / 100000
Iteration 0, loss = 0.0518
Iteration 20, loss = 0.0432
Iteration 40, loss = 0.0131
Iteration 60, loss = 0.0423
Iteration 80, loss = 0.0114
--- Epoch 198 / 100000
Iteration 0, loss = 0.0193
Iteration 20, loss = 0.0201
Iteration 40, loss = 0.0129
Iteration 60, loss = 0.0305
Iteration 80, loss = 0.0213
--- Epoch 199 / 100000
Iteration 0, loss = 0.0391
Iteration 20, loss = 0.0506
Iteration 40, loss = 0.0383
Iteration 60, loss = 0.0149
Iteration 80, loss = 0.0083
--- Epoch 200 / 100000
Iteration 0, loss = 0.0233
Iteration 20, loss = 0.0137
Iteration 40, loss = 0.0442
Iteration 60, loss = 0.0153
Iteration 80, loss = 0.0104
--- Epoch 201 / 100000
Iteration 0, loss = 0.0119
Iteration 20, loss = 0.0110
Iteration 40, loss = 0.0206
Iteration 60, loss = 0.0147
Iteration 80, loss = 0.0263
--- Epoch 202 / 100000
Iteration 0, loss = 0.0252
Iteration 20, loss = 0.0315
Iteration 40, loss = 0.0131
Iteration 60, loss = 0.0218
Iteration 80, loss = 0.0331
--- Epoch 203 / 100000
Iteration 0, loss = 0.0130
Iteration 20, loss = 0.0149
Iteration 40, loss = 0.0099
Iteration 60, loss = 0.0215
Iteration 80, loss = 0.0352
--- Epoch 204 / 100000
Iteration 0, loss = 0.0141
Iteration 20, loss = 0.0227
Iteration 40, loss = 0.0189
Iteration 60, loss = 0.0109
Iteration 80, loss = 0.0576
--- Epoch 205 / 100000
Iteration 0, loss = 0.0111
Iteration 20, loss = 0.0390
Iteration 40, loss = 0.0197
Iteration 60, loss = 0.0272
Iteration 80, loss = 0.0527
--- Epoch 206 / 100000
Iteration 0, loss = 0.0151
Iteration 20, loss = 0.0332
Iteration 40, loss = 0.0161
Iteration 60, loss = 0.0375
Iteration 80, loss = 0.0193
--- Epoch 207 / 100000
Iteration 0, loss = 0.0144
Iteration 20, loss = 0.0264
Iteration 40, loss = 0.0384
Iteration 60, loss = 0.0151
Iteration 80, loss = 0.0113
--- Epoch 208 / 100000
Iteration 0, loss = 0.0173
Iteration 20, loss = 0.0164
Iteration 40, loss = 0.0225
Iteration 60, loss = 0.0305
Iteration 80, loss = 0.0426
--- Epoch 209 / 100000
Iteration 0, loss = 0.0201
Iteration 20, loss = 0.0174
Iteration 40, loss = 0.0195
Iteration 60, loss = 0.0126
Iteration 80, loss = 0.0535
--- Epoch 210 / 100000
Iteration 0, loss = 0.0336
Iteration 20, loss = 0.0185
Iteration 40, loss = 0.0148
Iteration 60, loss = 0.0113
Iteration 80, loss = 0.0187
--- Epoch 211 / 100000
Iteration 0, loss = 0.0138
Iteration 20, loss = 0.0121
Iteration 40, loss = 0.0166
Iteration 60, loss = 0.0387
Iteration 80, loss = 0.0146
--- Epoch 212 / 100000
Iteration 0, loss = 0.0426
Iteration 20, loss = 0.0163
Iteration 40, loss = 0.0208
Iteration 60, loss = 0.0231
Iteration 80, loss = 0.0159
--- Epoch 213 / 100000
Iteration 0, loss = 0.0191
Iteration 20, loss = 0.0197
Iteration 40, loss = 0.0186
Iteration 60, loss = 0.0188
Iteration 80, loss = 0.0134
--- Epoch 214 / 100000
Iteration 0, loss = 0.0200
Iteration 20, loss = 0.0241
Iteration 40, loss = 0.0481
Iteration 60, loss = 0.0145
Iteration 80, loss = 0.0159
--- Epoch 215 / 100000
Iteration 0, loss = 0.0290
Iteration 20, loss = 0.0147
Iteration 40, loss = 0.0154
Iteration 60, loss = 0.0167
Iteration 80, loss = 0.0195
--- Epoch 216 / 100000
Iteration 0, loss = 0.0156
Iteration 20, loss = 0.0116
Iteration 40, loss = 0.0301
Iteration 60, loss = 0.0157
Iteration 80, loss = 0.0271
--- Epoch 217 / 100000
Iteration 0, loss = 0.0168
Iteration 20, loss = 0.0391
Iteration 40, loss = 0.0169
Iteration 60, loss = 0.0233
Iteration 80, loss = 0.0152
--- Epoch 218 / 100000
Iteration 0, loss = 0.0178
Iteration 20, loss = 0.0149
Iteration 40, loss = 0.0114
Iteration 60, loss = 0.0317
Iteration 80, loss = 0.0127
--- Epoch 219 / 100000
Iteration 0, loss = 0.0116
Iteration 20, loss = 0.0240
Iteration 40, loss = 0.0303
Iteration 60, loss = 0.0134
Iteration 80, loss = 0.0240
--- Epoch 220 / 100000
Iteration 0, loss = 0.0267
Iteration 20, loss = 0.0303
Iteration 40, loss = 0.0165
Iteration 60, loss = 0.0214
Iteration 80, loss = 0.0188
--- Epoch 221 / 100000
Iteration 0, loss = 0.0349
Iteration 20, loss = 0.0213
Iteration 40, loss = 0.0167
Iteration 60, loss = 0.0182
Iteration 80, loss = 0.0244
--- Epoch 222 / 100000
Iteration 0, loss = 0.0168
Iteration 20, loss = 0.0097
Iteration 40, loss = 0.0324
Iteration 60, loss = 0.0273
Iteration 80, loss = 0.0412
--- Epoch 223 / 100000
Iteration 0, loss = 0.0111
Iteration 20, loss = 0.0443
Iteration 40, loss = 0.0175
Iteration 60, loss = 0.0237
Iteration 80, loss = 0.0125
--- Epoch 224 / 100000
Iteration 0, loss = 0.0098
Iteration 20, loss = 0.0110
Iteration 40, loss = 0.0141
Iteration 60, loss = 0.0121
Iteration 80, loss = 0.0248
--- Epoch 225 / 100000
Iteration 0, loss = 0.0357
Iteration 20, loss = 0.0328
Iteration 40, loss = 0.0188
Iteration 60, loss = 0.0132
Iteration 80, loss = 0.0222
--- Epoch 226 / 100000
Iteration 0, loss = 0.0186
Iteration 20, loss = 0.0149
Iteration 40, loss = 0.0377
Iteration 60, loss = 0.0122
Iteration 80, loss = 0.0282
--- Epoch 227 / 100000
Iteration 0, loss = 0.0134
Iteration 20, loss = 0.0350
Iteration 40, loss = 0.0141
Iteration 60, loss = 0.0138
Iteration 80, loss = 0.0222
--- Epoch 228 / 100000
Iteration 0, loss = 0.0126
Iteration 20, loss = 0.0192
Iteration 40, loss = 0.0261
Iteration 60, loss = 0.0427
Iteration 80, loss = 0.0161
--- Epoch 229 / 100000
Iteration 0, loss = 0.0184
Iteration 20, loss = 0.0187
Iteration 40, loss = 0.0109
Iteration 60, loss = 0.0212
Iteration 80, loss = 0.0161
--- Epoch 230 / 100000
Iteration 0, loss = 0.0542
Iteration 20, loss = 0.0132
Iteration 40, loss = 0.0130
Iteration 60, loss = 0.0166
Iteration 80, loss = 0.0132
--- Epoch 231 / 100000
Iteration 0, loss = 0.0137
Iteration 20, loss = 0.0138
Iteration 40, loss = 0.0109
Iteration 60, loss = 0.0094
Iteration 80, loss = 0.0155
--- Epoch 232 / 100000
Iteration 0, loss = 0.0279
Iteration 20, loss = 0.0131
Iteration 40, loss = 0.0181
Iteration 60, loss = 0.0260
Iteration 80, loss = 0.0181
--- Epoch 233 / 100000
Iteration 0, loss = 0.0265
Iteration 20, loss = 0.0165
Iteration 40, loss = 0.0097
Iteration 60, loss = 0.0249
Iteration 80, loss = 0.0182
--- Epoch 234 / 100000
Iteration 0, loss = 0.0325
Iteration 20, loss = 0.0221
Iteration 40, loss = 0.0183
Iteration 60, loss = 0.0149
Iteration 80, loss = 0.0281
--- Epoch 235 / 100000
Iteration 0, loss = 0.0190
Iteration 20, loss = 0.0462
Iteration 40, loss = 0.0110
Iteration 60, loss = 0.0141
Iteration 80, loss = 0.0188
--- Epoch 236 / 100000
Iteration 0, loss = 0.0195
Iteration 20, loss = 0.0261
Iteration 40, loss = 0.0152
Iteration 60, loss = 0.0241
Iteration 80, loss = 0.0319
--- Epoch 237 / 100000
Iteration 0, loss = 0.0203
Iteration 20, loss = 0.0188
Iteration 40, loss = 0.0285
Iteration 60, loss = 0.0210
Iteration 80, loss = 0.0250
--- Epoch 238 / 100000
Iteration 0, loss = 0.0107
Iteration 20, loss = 0.0245
Iteration 40, loss = 0.0125
Iteration 60, loss = 0.0151
Iteration 80, loss = 0.0082
--- Epoch 239 / 100000
Iteration 0, loss = 0.0137
Iteration 20, loss = 0.0241
Iteration 40, loss = 0.0162
Iteration 60, loss = 0.0236
Iteration 80, loss = 0.0126
--- Epoch 240 / 100000
Iteration 0, loss = 0.0236
Iteration 20, loss = 0.0275
Iteration 40, loss = 0.0608
Iteration 60, loss = 0.0118
Iteration 80, loss = 0.0137
--- Epoch 241 / 100000
Iteration 0, loss = 0.0311
Iteration 20, loss = 0.0177
Iteration 40, loss = 0.0183
Iteration 60, loss = 0.0146
Iteration 80, loss = 0.0411
--- Epoch 242 / 100000
Iteration 0, loss = 0.0228
Iteration 20, loss = 0.0101
Iteration 40, loss = 0.0445
Iteration 60, loss = 0.0192
Iteration 80, loss = 0.0320
--- Epoch 243 / 100000
Iteration 0, loss = 0.0117
Iteration 20, loss = 0.0199
Iteration 40, loss = 0.0151
Iteration 60, loss = 0.0260
Iteration 80, loss = 0.0122
--- Epoch 244 / 100000
Iteration 0, loss = 0.0227
Iteration 20, loss = 0.0210
Iteration 40, loss = 0.0123
Iteration 60, loss = 0.0477
Iteration 80, loss = 0.0309
--- Epoch 245 / 100000
Iteration 0, loss = 0.0097
Iteration 20, loss = 0.0131
Iteration 40, loss = 0.0164
Iteration 60, loss = 0.0124
Iteration 80, loss = 0.0693
--- Epoch 246 / 100000
Iteration 0, loss = 0.0169
Iteration 20, loss = 0.0241
Iteration 40, loss = 0.0192
Iteration 60, loss = 0.0119
Iteration 80, loss = 0.0239
--- Epoch 247 / 100000
Iteration 0, loss = 0.0300
Iteration 20, loss = 0.0146
Iteration 40, loss = 0.0233
Iteration 60, loss = 0.0184
Iteration 80, loss = 0.0221
--- Epoch 248 / 100000
Iteration 0, loss = 0.0217
Iteration 20, loss = 0.0191
Iteration 40, loss = 0.0132
Iteration 60, loss = 0.0147
Iteration 80, loss = 0.0199
--- Epoch 249 / 100000
Iteration 0, loss = 0.0491
Iteration 20, loss = 0.0103
Iteration 40, loss = 0.0175
Iteration 60, loss = 0.0238
Iteration 80, loss = 0.0150
--- Epoch 250 / 100000
Iteration 0, loss = 0.0211
Iteration 20, loss = 0.0223
Iteration 40, loss = 0.0218
Iteration 60, loss = 0.0210
Iteration 80, loss = 0.0136
--- Epoch 251 / 100000
Iteration 0, loss = 0.0109
Iteration 20, loss = 0.0214
Iteration 40, loss = 0.0113
Iteration 60, loss = 0.0179
Iteration 80, loss = 0.0232
--- Epoch 252 / 100000
Iteration 0, loss = 0.0195
Iteration 20, loss = 0.0133
Iteration 40, loss = 0.0386
Iteration 60, loss = 0.0132
Iteration 80, loss = 0.0414
--- Epoch 253 / 100000
Iteration 0, loss = 0.0119
Iteration 20, loss = 0.0299
Iteration 40, loss = 0.0285
Iteration 60, loss = 0.0370
Iteration 80, loss = 0.0100
--- Epoch 254 / 100000
Iteration 0, loss = 0.0438
Iteration 20, loss = 0.0639
Iteration 40, loss = 0.0157
Iteration 60, loss = 0.0210
Iteration 80, loss = 0.0116
--- Epoch 255 / 100000
Iteration 0, loss = 0.0239
Iteration 20, loss = 0.0158
Iteration 40, loss = 0.0114
Iteration 60, loss = 0.0106
Iteration 80, loss = 0.0084
--- Epoch 256 / 100000
Iteration 0, loss = 0.0178
Iteration 20, loss = 0.0268
Iteration 40, loss = 0.0113
Iteration 60, loss = 0.0278
Iteration 80, loss = 0.0157
--- Epoch 257 / 100000
Iteration 0, loss = 0.0178
Iteration 20, loss = 0.0385
Iteration 40, loss = 0.0138
Iteration 60, loss = 0.0159
Iteration 80, loss = 0.0119
--- Epoch 258 / 100000
Iteration 0, loss = 0.0312
Iteration 20, loss = 0.0140
Iteration 40, loss = 0.0195
Iteration 60, loss = 0.0105
Iteration 80, loss = 0.0161
--- Epoch 259 / 100000
Iteration 0, loss = 0.0274
Iteration 20, loss = 0.0339
Iteration 40, loss = 0.0163
Iteration 60, loss = 0.0164
Iteration 80, loss = 0.0158
--- Epoch 260 / 100000
Iteration 0, loss = 0.0286
Iteration 20, loss = 0.0190
Iteration 40, loss = 0.0125
Iteration 60, loss = 0.0121
Iteration 80, loss = 0.0119
--- Epoch 261 / 100000
Iteration 0, loss = 0.0310
Iteration 20, loss = 0.0110
Iteration 40, loss = 0.0286
Iteration 60, loss = 0.0142
Iteration 80, loss = 0.0143
--- Epoch 262 / 100000
Iteration 0, loss = 0.0132
Iteration 20, loss = 0.0169
Iteration 40, loss = 0.0240
Iteration 60, loss = 0.0140
Iteration 80, loss = 0.0171
--- Epoch 263 / 100000
Iteration 0, loss = 0.0145
Iteration 20, loss = 0.0166
Iteration 40, loss = 0.0256
Iteration 60, loss = 0.0117
Iteration 80, loss = 0.0127
--- Epoch 264 / 100000
Iteration 0, loss = 0.0533
Iteration 20, loss = 0.0103
Iteration 40, loss = 0.0232
Iteration 60, loss = 0.0126
Iteration 80, loss = 0.0112
--- Epoch 265 / 100000
Iteration 0, loss = 0.0259
Iteration 20, loss = 0.0187
Iteration 40, loss = 0.0311
Iteration 60, loss = 0.0157
Iteration 80, loss = 0.0138
--- Epoch 266 / 100000
Iteration 0, loss = 0.0211
Iteration 20, loss = 0.0139
Iteration 40, loss = 0.0206
Iteration 60, loss = 0.0181
Iteration 80, loss = 0.0183
--- Epoch 267 / 100000
Iteration 0, loss = 0.0116
Iteration 20, loss = 0.0233
Iteration 40, loss = 0.0335
Iteration 60, loss = 0.0284
Iteration 80, loss = 0.0136
--- Epoch 268 / 100000
Iteration 0, loss = 0.0205
Iteration 20, loss = 0.0130
Iteration 40, loss = 0.0384
Iteration 60, loss = 0.0290
Iteration 80, loss = 0.0230
--- Epoch 269 / 100000
Iteration 0, loss = 0.0184
Iteration 20, loss = 0.0129
Iteration 40, loss = 0.0130
Iteration 60, loss = 0.0301
Iteration 80, loss = 0.0269
--- Epoch 270 / 100000
Iteration 0, loss = 0.0226
Iteration 20, loss = 0.0190
Iteration 40, loss = 0.0204
Iteration 60, loss = 0.0163
Iteration 80, loss = 0.0176
--- Epoch 271 / 100000
Iteration 0, loss = 0.0162
Iteration 20, loss = 0.0206
Iteration 40, loss = 0.0270
Iteration 60, loss = 0.0115
Iteration 80, loss = 0.0294
--- Epoch 272 / 100000
Iteration 0, loss = 0.0153
Iteration 20, loss = 0.0104
Iteration 40, loss = 0.0187
Iteration 60, loss = 0.0216
Iteration 80, loss = 0.0146
--- Epoch 273 / 100000
Iteration 0, loss = 0.0110
Iteration 20, loss = 0.0103
Iteration 40, loss = 0.0207
Iteration 60, loss = 0.0113
Iteration 80, loss = 0.0210
--- Epoch 274 / 100000
Iteration 0, loss = 0.0212
Iteration 20, loss = 0.0189
Iteration 40, loss = 0.0230
Iteration 60, loss = 0.0398
Iteration 80, loss = 0.0107
--- Epoch 275 / 100000
Iteration 0, loss = 0.0113
Iteration 20, loss = 0.0103
Iteration 40, loss = 0.0151
Iteration 60, loss = 0.0244
Iteration 80, loss = 0.0266
--- Epoch 276 / 100000
Iteration 0, loss = 0.0117
Iteration 20, loss = 0.0130
Iteration 40, loss = 0.0172
Iteration 60, loss = 0.0175
Iteration 80, loss = 0.0137
--- Epoch 277 / 100000
Iteration 0, loss = 0.0111
Iteration 20, loss = 0.0293
Iteration 40, loss = 0.0115
Iteration 60, loss = 0.0094
Iteration 80, loss = 0.0194
--- Epoch 278 / 100000
Iteration 0, loss = 0.0086
Iteration 20, loss = 0.0328
Iteration 40, loss = 0.0181
Iteration 60, loss = 0.0208
Iteration 80, loss = 0.0216
--- Epoch 279 / 100000
Iteration 0, loss = 0.0325
Iteration 20, loss = 0.0114
Iteration 40, loss = 0.0298
Iteration 60, loss = 0.0332
Iteration 80, loss = 0.0144
--- Epoch 280 / 100000
Iteration 0, loss = 0.0114
Iteration 20, loss = 0.0280
Iteration 40, loss = 0.0196
Iteration 60, loss = 0.0230
Iteration 80, loss = 0.0292
--- Epoch 281 / 100000
Iteration 0, loss = 0.0115
Iteration 20, loss = 0.0085
Iteration 40, loss = 0.0232
Iteration 60, loss = 0.0144
Iteration 80, loss = 0.0171
--- Epoch 282 / 100000
Iteration 0, loss = 0.0265
Iteration 20, loss = 0.0164
Iteration 40, loss = 0.0182
Iteration 60, loss = 0.0159
Iteration 80, loss = 0.0220
--- Epoch 283 / 100000
Iteration 0, loss = 0.0207
Iteration 20, loss = 0.0173
Iteration 40, loss = 0.0160
Iteration 60, loss = 0.0151
Iteration 80, loss = 0.0165
--- Epoch 284 / 100000
Iteration 0, loss = 0.0156
Iteration 20, loss = 0.0152
Iteration 40, loss = 0.0188
Iteration 60, loss = 0.0157
Iteration 80, loss = 0.0258
--- Epoch 285 / 100000
Iteration 0, loss = 0.0221
Iteration 20, loss = 0.0200
Iteration 40, loss = 0.0208
Iteration 60, loss = 0.0162
Iteration 80, loss = 0.0150
--- Epoch 286 / 100000
Iteration 0, loss = 0.0276
Iteration 20, loss = 0.0157
Iteration 40, loss = 0.0148
Iteration 60, loss = 0.0149
Iteration 80, loss = 0.0335
--- Epoch 287 / 100000
Iteration 0, loss = 0.0213
Iteration 20, loss = 0.0296
Iteration 40, loss = 0.0098
Iteration 60, loss = 0.0188
Iteration 80, loss = 0.0124
--- Epoch 288 / 100000
Iteration 0, loss = 0.0115
Iteration 20, loss = 0.0147
Iteration 40, loss = 0.0115
Iteration 60, loss = 0.0388
Iteration 80, loss = 0.0169
--- Epoch 289 / 100000
Iteration 0, loss = 0.0172
Iteration 20, loss = 0.0253
Iteration 40, loss = 0.0169
Iteration 60, loss = 0.0140
Iteration 80, loss = 0.0134
--- Epoch 290 / 100000
Iteration 0, loss = 0.0276
Iteration 20, loss = 0.0216
Iteration 40, loss = 0.0249
Iteration 60, loss = 0.0217
Iteration 80, loss = 0.0330
--- Epoch 291 / 100000
Iteration 0, loss = 0.0110
Iteration 20, loss = 0.0121
Iteration 40, loss = 0.0202
Iteration 60, loss = 0.0149
Iteration 80, loss = 0.0163
--- Epoch 292 / 100000
Iteration 0, loss = 0.0615
Iteration 20, loss = 0.0176
Iteration 40, loss = 0.0079
Iteration 60, loss = 0.0384
Iteration 80, loss = 0.0094
--- Epoch 293 / 100000
Iteration 0, loss = 0.0187
Iteration 20, loss = 0.0139
Iteration 40, loss = 0.0135
Iteration 60, loss = 0.0463
Iteration 80, loss = 0.0202
--- Epoch 294 / 100000
Iteration 0, loss = 0.0172
Iteration 20, loss = 0.0170
Iteration 40, loss = 0.0171
Iteration 60, loss = 0.0116
Iteration 80, loss = 0.0103
--- Epoch 295 / 100000
Iteration 0, loss = 0.0242
Iteration 20, loss = 0.0138
Iteration 40, loss = 0.0139
Iteration 60, loss = 0.0412
Iteration 80, loss = 0.0174
--- Epoch 296 / 100000
Iteration 0, loss = 0.0114
Iteration 20, loss = 0.0125
Iteration 40, loss = 0.0282
Iteration 60, loss = 0.0143
Iteration 80, loss = 0.0192
--- Epoch 297 / 100000
Iteration 0, loss = 0.0198
Iteration 20, loss = 0.0157
Iteration 40, loss = 0.0294
Iteration 60, loss = 0.0173
Iteration 80, loss = 0.0162
--- Epoch 298 / 100000
Iteration 0, loss = 0.0114
Iteration 20, loss = 0.0141
Iteration 40, loss = 0.0170
Iteration 60, loss = 0.0157
Iteration 80, loss = 0.0142
--- Epoch 299 / 100000
Iteration 0, loss = 0.0219
Iteration 20, loss = 0.0166
Iteration 40, loss = 0.0215
Iteration 60, loss = 0.0225
Iteration 80, loss = 0.0121
--- Epoch 300 / 100000
Iteration 0, loss = 0.0449
Iteration 20, loss = 0.0126
Iteration 40, loss = 0.0593
Iteration 60, loss = 0.0182
Iteration 80, loss = 0.0200
--- Epoch 301 / 100000
Iteration 0, loss = 0.0127
Iteration 20, loss = 0.0104
Iteration 40, loss = 0.0143
Iteration 60, loss = 0.0165
Iteration 80, loss = 0.0166
--- Epoch 302 / 100000
Iteration 0, loss = 0.0117
Iteration 20, loss = 0.0218
Iteration 40, loss = 0.0135
Iteration 60, loss = 0.0185
Iteration 80, loss = 0.0130
--- Epoch 303 / 100000
Iteration 0, loss = 0.0107
Iteration 20, loss = 0.0184
Iteration 40, loss = 0.0127
Iteration 60, loss = 0.0156
Iteration 80, loss = 0.0190
--- Epoch 304 / 100000
Iteration 0, loss = 0.0112
Iteration 20, loss = 0.0208
Iteration 40, loss = 0.0311
Iteration 60, loss = 0.0147
Iteration 80, loss = 0.0201
--- Epoch 305 / 100000
Iteration 0, loss = 0.0597
Iteration 20, loss = 0.0251
Iteration 40, loss = 0.0241
Iteration 60, loss = 0.0175
Iteration 80, loss = 0.0152
--- Epoch 306 / 100000
Iteration 0, loss = 0.0112
Iteration 20, loss = 0.0155
Iteration 40, loss = 0.0152
Iteration 60, loss = 0.0319
Iteration 80, loss = 0.0282
--- Epoch 307 / 100000
Iteration 0, loss = 0.0154
Iteration 20, loss = 0.0150
Iteration 40, loss = 0.0171
Iteration 60, loss = 0.0342
Iteration 80, loss = 0.0150
--- Epoch 308 / 100000
Iteration 0, loss = 0.0174
Iteration 20, loss = 0.0217
Iteration 40, loss = 0.0163
Iteration 60, loss = 0.0136
Iteration 80, loss = 0.0193
--- Epoch 309 / 100000
Iteration 0, loss = 0.0170
Iteration 20, loss = 0.0317
Iteration 40, loss = 0.0203
Iteration 60, loss = 0.0164
Iteration 80, loss = 0.0251
--- Epoch 310 / 100000
Iteration 0, loss = 0.0098
Iteration 20, loss = 0.0189
Iteration 40, loss = 0.0159
Iteration 60, loss = 0.0188
Iteration 80, loss = 0.0189
--- Epoch 311 / 100000
Iteration 0, loss = 0.0185
Iteration 20, loss = 0.0121
Iteration 40, loss = 0.0213
Iteration 60, loss = 0.0110
Iteration 80, loss = 0.0244
--- Epoch 312 / 100000
Iteration 0, loss = 0.0299
Iteration 20, loss = 0.0275
Iteration 40, loss = 0.0160
Iteration 60, loss = 0.0149
Iteration 80, loss = 0.0127
--- Epoch 313 / 100000
Iteration 0, loss = 0.0338
Iteration 20, loss = 0.0126
Iteration 40, loss = 0.0152
Iteration 60, loss = 0.0288
Iteration 80, loss = 0.0178
--- Epoch 314 / 100000
Iteration 0, loss = 0.0096
Iteration 20, loss = 0.0223
Iteration 40, loss = 0.0195
Iteration 60, loss = 0.0107
Iteration 80, loss = 0.0123
--- Epoch 315 / 100000
Iteration 0, loss = 0.0757
Iteration 20, loss = 0.0162
Iteration 40, loss = 0.0114
Iteration 60, loss = 0.0211
Iteration 80, loss = 0.0231
--- Epoch 316 / 100000
Iteration 0, loss = 0.0224
Iteration 20, loss = 0.0346
Iteration 40, loss = 0.0185
Iteration 60, loss = 0.0110
Iteration 80, loss = 0.0098
--- Epoch 317 / 100000
Iteration 0, loss = 0.0225
Iteration 20, loss = 0.0290
Iteration 40, loss = 0.0119
Iteration 60, loss = 0.0157
Iteration 80, loss = 0.0209
--- Epoch 318 / 100000
Iteration 0, loss = 0.0099
Iteration 20, loss = 0.0329
Iteration 40, loss = 0.0322
Iteration 60, loss = 0.0344
Iteration 80, loss = 0.0181
--- Epoch 319 / 100000
Iteration 0, loss = 0.0254
Iteration 20, loss = 0.0129
Iteration 40, loss = 0.0187
Iteration 60, loss = 0.0188
Iteration 80, loss = 0.0283
--- Epoch 320 / 100000
Iteration 0, loss = 0.0102
Iteration 20, loss = 0.0107
Iteration 40, loss = 0.0154
Iteration 60, loss = 0.0178
Iteration 80, loss = 0.0248
--- Epoch 321 / 100000
Iteration 0, loss = 0.0214
Iteration 20, loss = 0.0172
Iteration 40, loss = 0.0312
Iteration 60, loss = 0.0088
Iteration 80, loss = 0.0154
--- Epoch 322 / 100000
Iteration 0, loss = 0.0233
Iteration 20, loss = 0.0201
Iteration 40, loss = 0.0074
Iteration 60, loss = 0.0204
Iteration 80, loss = 0.0228
--- Epoch 323 / 100000
Iteration 0, loss = 0.0115
Iteration 20, loss = 0.0122
Iteration 40, loss = 0.0171
Iteration 60, loss = 0.0226
Iteration 80, loss = 0.0230
--- Epoch 324 / 100000
Iteration 0, loss = 0.0394
Iteration 20, loss = 0.0135
Iteration 40, loss = 0.0103
Iteration 60, loss = 0.0149
Iteration 80, loss = 0.0300
--- Epoch 325 / 100000
Iteration 0, loss = 0.0139
Iteration 20, loss = 0.0122
Iteration 40, loss = 0.0149
Iteration 60, loss = 0.0329
Iteration 80, loss = 0.0155
--- Epoch 326 / 100000
Iteration 0, loss = 0.0243
Iteration 20, loss = 0.0350
Iteration 40, loss = 0.0203
Iteration 60, loss = 0.0193
Iteration 80, loss = 0.0106
--- Epoch 327 / 100000
Iteration 0, loss = 0.0122
Iteration 20, loss = 0.0104
Iteration 40, loss = 0.0122
Iteration 60, loss = 0.0143
Iteration 80, loss = 0.0670
--- Epoch 328 / 100000
Iteration 0, loss = 0.0449
Iteration 20, loss = 0.0281
Iteration 40, loss = 0.0131
Iteration 60, loss = 0.0258
Iteration 80, loss = 0.0148
--- Epoch 329 / 100000
Iteration 0, loss = 0.0136
Iteration 20, loss = 0.0138
Iteration 40, loss = 0.0122
Iteration 60, loss = 0.0171
Iteration 80, loss = 0.0214
--- Epoch 330 / 100000
Iteration 0, loss = 0.0172
Iteration 20, loss = 0.0245
Iteration 40, loss = 0.0162
Iteration 60, loss = 0.0124
Iteration 80, loss = 0.0198
--- Epoch 331 / 100000
Iteration 0, loss = 0.0140
Iteration 20, loss = 0.0306
Iteration 40, loss = 0.0233
Iteration 60, loss = 0.0298
Iteration 80, loss = 0.0296
--- Epoch 332 / 100000
Iteration 0, loss = 0.0178
Iteration 20, loss = 0.0139
Iteration 40, loss = 0.0142
Iteration 60, loss = 0.0106
Iteration 80, loss = 0.0149
--- Epoch 333 / 100000
Iteration 0, loss = 0.0316
Iteration 20, loss = 0.0142
Iteration 40, loss = 0.0276
Iteration 60, loss = 0.0123
Iteration 80, loss = 0.0187
--- Epoch 334 / 100000
Iteration 0, loss = 0.0274
Iteration 20, loss = 0.0142
Iteration 40, loss = 0.0137
Iteration 60, loss = 0.0238
Iteration 80, loss = 0.0116
--- Epoch 335 / 100000
Iteration 0, loss = 0.0178
Iteration 20, loss = 0.0158
Iteration 40, loss = 0.0107
Iteration 60, loss = 0.0175
Iteration 80, loss = 0.0198
--- Epoch 336 / 100000
Iteration 0, loss = 0.0153
Iteration 20, loss = 0.0107
Iteration 40, loss = 0.0142
Iteration 60, loss = 0.0229
Iteration 80, loss = 0.0162
--- Epoch 337 / 100000
Iteration 0, loss = 0.0214
Iteration 20, loss = 0.0187
Iteration 40, loss = 0.0187
Iteration 60, loss = 0.0117
Iteration 80, loss = 0.0152
--- Epoch 338 / 100000
Iteration 0, loss = 0.0149
Iteration 20, loss = 0.0312
Iteration 40, loss = 0.0263
Iteration 60, loss = 0.0099
Iteration 80, loss = 0.0169
--- Epoch 339 / 100000
Iteration 0, loss = 0.0204
Iteration 20, loss = 0.0144
Iteration 40, loss = 0.0198
Iteration 60, loss = 0.0250
Iteration 80, loss = 0.0427
--- Epoch 340 / 100000
Iteration 0, loss = 0.0238
Iteration 20, loss = 0.0278
Iteration 40, loss = 0.0129
Iteration 60, loss = 0.0131
Iteration 80, loss = 0.0282
--- Epoch 341 / 100000
Iteration 0, loss = 0.0149
Iteration 20, loss = 0.0532
Iteration 40, loss = 0.0324
Iteration 60, loss = 0.0156
Iteration 80, loss = 0.0313
--- Epoch 342 / 100000
Iteration 0, loss = 0.0183
Iteration 20, loss = 0.0138
Iteration 40, loss = 0.0144
Iteration 60, loss = 0.0202
Iteration 80, loss = 0.0328
--- Epoch 343 / 100000
Iteration 0, loss = 0.0270
Iteration 20, loss = 0.0157
Iteration 40, loss = 0.0209
Iteration 60, loss = 0.0108
Iteration 80, loss = 0.0212
--- Epoch 344 / 100000
Iteration 0, loss = 0.0232
Iteration 20, loss = 0.0128
Iteration 40, loss = 0.0200
Iteration 60, loss = 0.0100
Iteration 80, loss = 0.0217
--- Epoch 345 / 100000
Iteration 0, loss = 0.0112
Iteration 20, loss = 0.0194
Iteration 40, loss = 0.0461
Iteration 60, loss = 0.0156
Iteration 80, loss = 0.0125
--- Epoch 346 / 100000
Iteration 0, loss = 0.0156
Iteration 20, loss = 0.0210
Iteration 40, loss = 0.0177
Iteration 60, loss = 0.0233
Iteration 80, loss = 0.0182
--- Epoch 347 / 100000
Iteration 0, loss = 0.0215
Iteration 20, loss = 0.0101
Iteration 40, loss = 0.0112
Iteration 60, loss = 0.0134
Iteration 80, loss = 0.0251
--- Epoch 348 / 100000
Iteration 0, loss = 0.0226
Iteration 20, loss = 0.0201
Iteration 40, loss = 0.0168
Iteration 60, loss = 0.0199
Iteration 80, loss = 0.0110
--- Epoch 349 / 100000
Iteration 0, loss = 0.0167
Iteration 20, loss = 0.0257
Iteration 40, loss = 0.0113
Iteration 60, loss = 0.0105
Iteration 80, loss = 0.0100
--- Epoch 350 / 100000
Iteration 0, loss = 0.0218
Iteration 20, loss = 0.0144
Iteration 40, loss = 0.0165
Iteration 60, loss = 0.0247
Iteration 80, loss = 0.0261
--- Epoch 351 / 100000
Iteration 0, loss = 0.0162
Iteration 20, loss = 0.0117
Iteration 40, loss = 0.0095
Iteration 60, loss = 0.0323
Iteration 80, loss = 0.0109
--- Epoch 352 / 100000
Iteration 0, loss = 0.0138
Iteration 20, loss = 0.0263
Iteration 40, loss = 0.0205
Iteration 60, loss = 0.0211
Iteration 80, loss = 0.0138
--- Epoch 353 / 100000
Iteration 0, loss = 0.0169
Iteration 20, loss = 0.0220
Iteration 40, loss = 0.0812
Iteration 60, loss = 0.0152
Iteration 80, loss = 0.0162
--- Epoch 354 / 100000
Iteration 0, loss = 0.0100
Iteration 20, loss = 0.0168
Iteration 40, loss = 0.0253
Iteration 60, loss = 0.0098
Iteration 80, loss = 0.0247
--- Epoch 355 / 100000
Iteration 0, loss = 0.0150
Iteration 20, loss = 0.0123
Iteration 40, loss = 0.0187
Iteration 60, loss = 0.0113
Iteration 80, loss = 0.0094
--- Epoch 356 / 100000
Iteration 0, loss = 0.0134
Iteration 20, loss = 0.0085
Iteration 40, loss = 0.0110
Iteration 60, loss = 0.0135
Iteration 80, loss = 0.0412
--- Epoch 357 / 100000
Iteration 0, loss = 0.0148
Iteration 20, loss = 0.0294
Iteration 40, loss = 0.0138
Iteration 60, loss = 0.0069
Iteration 80, loss = 0.0162
--- Epoch 358 / 100000
Iteration 0, loss = 0.0173
Iteration 20, loss = 0.0270
Iteration 40, loss = 0.0254
Iteration 60, loss = 0.0258
Iteration 80, loss = 0.0110
--- Epoch 359 / 100000
Iteration 0, loss = 0.0268
Iteration 20, loss = 0.0112
Iteration 40, loss = 0.0145
Iteration 60, loss = 0.0186
Iteration 80, loss = 0.0188
--- Epoch 360 / 100000
Iteration 0, loss = 0.0199
Iteration 20, loss = 0.0155
Iteration 40, loss = 0.0179
Iteration 60, loss = 0.0269
Iteration 80, loss = 0.0104
--- Epoch 361 / 100000
Iteration 0, loss = 0.0207
Iteration 20, loss = 0.0222
Iteration 40, loss = 0.0093
Iteration 60, loss = 0.0343
Iteration 80, loss = 0.0260
--- Epoch 362 / 100000
Iteration 0, loss = 0.0143
Iteration 20, loss = 0.0142
Iteration 40, loss = 0.0170
Iteration 60, loss = 0.0143
Iteration 80, loss = 0.0168
--- Epoch 363 / 100000
Iteration 0, loss = 0.0098
Iteration 20, loss = 0.0528
Iteration 40, loss = 0.0136
Iteration 60, loss = 0.0167
Iteration 80, loss = 0.0197
--- Epoch 364 / 100000
Iteration 0, loss = 0.0203
Iteration 20, loss = 0.0194
Iteration 40, loss = 0.0522
Iteration 60, loss = 0.0343
Iteration 80, loss = 0.0220
--- Epoch 365 / 100000
Iteration 0, loss = 0.0053
Iteration 20, loss = 0.0175
Iteration 40, loss = 0.0439
Iteration 60, loss = 0.0279
Iteration 80, loss = 0.0201
--- Epoch 366 / 100000
Iteration 0, loss = 0.0087
Iteration 20, loss = 0.0153
Iteration 40, loss = 0.0115
Iteration 60, loss = 0.0090
Iteration 80, loss = 0.0164
--- Epoch 367 / 100000
Iteration 0, loss = 0.0158
Iteration 20, loss = 0.0126
Iteration 40, loss = 0.0179
Iteration 60, loss = 0.0187
Iteration 80, loss = 0.0174
--- Epoch 368 / 100000
Iteration 0, loss = 0.0160
Iteration 20, loss = 0.0195
Iteration 40, loss = 0.0116
Iteration 60, loss = 0.0403
Iteration 80, loss = 0.0219
--- Epoch 369 / 100000
Iteration 0, loss = 0.0104
Iteration 20, loss = 0.0191
Iteration 40, loss = 0.0198
Iteration 60, loss = 0.0286
Iteration 80, loss = 0.0183
--- Epoch 370 / 100000
Iteration 0, loss = 0.0120
Iteration 20, loss = 0.0247
Iteration 40, loss = 0.0152
Iteration 60, loss = 0.0100
Iteration 80, loss = 0.0081
--- Epoch 371 / 100000
Iteration 0, loss = 0.0142
Iteration 20, loss = 0.0133
Iteration 40, loss = 0.0164
Iteration 60, loss = 0.0180
Iteration 80, loss = 0.0092
--- Epoch 372 / 100000
Iteration 0, loss = 0.0154
Iteration 20, loss = 0.0193
Iteration 40, loss = 0.0262
Iteration 60, loss = 0.0182
Iteration 80, loss = 0.0140
--- Epoch 373 / 100000
Iteration 0, loss = 0.0099
Iteration 20, loss = 0.0156
Iteration 40, loss = 0.0189
Iteration 60, loss = 0.0156
Iteration 80, loss = 0.0184
--- Epoch 374 / 100000
Iteration 0, loss = 0.0146
Iteration 20, loss = 0.0218
Iteration 40, loss = 0.0171
Iteration 60, loss = 0.0278
Iteration 80, loss = 0.0392
--- Epoch 375 / 100000
Iteration 0, loss = 0.0318
Iteration 20, loss = 0.0263
Iteration 40, loss = 0.0109
Iteration 60, loss = 0.0166
Iteration 80, loss = 0.0160
--- Epoch 376 / 100000
Iteration 0, loss = 0.0211
Iteration 20, loss = 0.0149
Iteration 40, loss = 0.0238
Iteration 60, loss = 0.0093
Iteration 80, loss = 0.0219
--- Epoch 377 / 100000
Iteration 0, loss = 0.0172
Iteration 20, loss = 0.0105
Iteration 40, loss = 0.0111
Iteration 60, loss = 0.0378
Iteration 80, loss = 0.0192
--- Epoch 378 / 100000
Iteration 0, loss = 0.0179
Iteration 20, loss = 0.0147
Iteration 40, loss = 0.0328
Iteration 60, loss = 0.0279
Iteration 80, loss = 0.0270
--- Epoch 379 / 100000
Iteration 0, loss = 0.0270
Iteration 20, loss = 0.0253
Iteration 40, loss = 0.0251
Iteration 60, loss = 0.0152
Iteration 80, loss = 0.0186
--- Epoch 380 / 100000
Iteration 0, loss = 0.0163
Iteration 20, loss = 0.0138
Iteration 40, loss = 0.0287
Iteration 60, loss = 0.0141
Iteration 80, loss = 0.0267
--- Epoch 381 / 100000
Iteration 0, loss = 0.0114
Iteration 20, loss = 0.0136
Iteration 40, loss = 0.0253
Iteration 60, loss = 0.0141
Iteration 80, loss = 0.0153
--- Epoch 382 / 100000
Iteration 0, loss = 0.0155
Iteration 20, loss = 0.0198
Iteration 40, loss = 0.0133
Iteration 60, loss = 0.0147
Iteration 80, loss = 0.0128
--- Epoch 383 / 100000
Iteration 0, loss = 0.0235
Iteration 20, loss = 0.0135
Iteration 40, loss = 0.0196
Iteration 60, loss = 0.0154
Iteration 80, loss = 0.0117
--- Epoch 384 / 100000
Iteration 0, loss = 0.0141
Iteration 20, loss = 0.0111
Iteration 40, loss = 0.0244
Iteration 60, loss = 0.0152
Iteration 80, loss = 0.0164
--- Epoch 385 / 100000
Iteration 0, loss = 0.0089
Iteration 20, loss = 0.0205
Iteration 40, loss = 0.0202
Iteration 60, loss = 0.0149
Iteration 80, loss = 0.0160
--- Epoch 386 / 100000
Iteration 0, loss = 0.0097
Iteration 20, loss = 0.0143
Iteration 40, loss = 0.0125
Iteration 60, loss = 0.0128
Iteration 80, loss = 0.0122
--- Epoch 387 / 100000
Iteration 0, loss = 0.0120
Iteration 20, loss = 0.0162
Iteration 40, loss = 0.0224
Iteration 60, loss = 0.0173
Iteration 80, loss = 0.0359
--- Epoch 388 / 100000
Iteration 0, loss = 0.0143
Iteration 20, loss = 0.0140
Iteration 40, loss = 0.0140
Iteration 60, loss = 0.0225
Iteration 80, loss = 0.0276
--- Epoch 389 / 100000
Iteration 0, loss = 0.0156
Iteration 20, loss = 0.0120
Iteration 40, loss = 0.0151
Iteration 60, loss = 0.0161
Iteration 80, loss = 0.0226
--- Epoch 390 / 100000
Iteration 0, loss = 0.0160
Iteration 20, loss = 0.0153
Iteration 40, loss = 0.0199
Iteration 60, loss = 0.0168
Iteration 80, loss = 0.0223
--- Epoch 391 / 100000
Iteration 0, loss = 0.0088
Iteration 20, loss = 0.0150
Iteration 40, loss = 0.0145
Iteration 60, loss = 0.0229
Iteration 80, loss = 0.0173
--- Epoch 392 / 100000
Iteration 0, loss = 0.0152
Iteration 20, loss = 0.0179
Iteration 40, loss = 0.0128
Iteration 60, loss = 0.0128
Iteration 80, loss = 0.0269
--- Epoch 393 / 100000
Iteration 0, loss = 0.0155
Iteration 20, loss = 0.0275
Iteration 40, loss = 0.0184
Iteration 60, loss = 0.0088
Iteration 80, loss = 0.0179
--- Epoch 394 / 100000
Iteration 0, loss = 0.0115
Iteration 20, loss = 0.0205
Iteration 40, loss = 0.0173
Iteration 60, loss = 0.0278
Iteration 80, loss = 0.0695
--- Epoch 395 / 100000
Iteration 0, loss = 0.0172
Iteration 20, loss = 0.0136
Iteration 40, loss = 0.0155
Iteration 60, loss = 0.0184
Iteration 80, loss = 0.0147
--- Epoch 396 / 100000
Iteration 0, loss = 0.0136
Iteration 20, loss = 0.0214
Iteration 40, loss = 0.0149
Iteration 60, loss = 0.0228
Iteration 80, loss = 0.0153
--- Epoch 397 / 100000
Iteration 0, loss = 0.0355
Iteration 20, loss = 0.0160
Iteration 40, loss = 0.0347
Iteration 60, loss = 0.0134
Iteration 80, loss = 0.0088
--- Epoch 398 / 100000
Iteration 0, loss = 0.0056
Iteration 20, loss = 0.0138
Iteration 40, loss = 0.0197
Iteration 60, loss = 0.0218
Iteration 80, loss = 0.0249
--- Epoch 399 / 100000
Iteration 0, loss = 0.0217
Iteration 20, loss = 0.0366
Iteration 40, loss = 0.0130
Iteration 60, loss = 0.0176
Iteration 80, loss = 0.0122
--- Epoch 400 / 100000
Iteration 0, loss = 0.0145
Iteration 20, loss = 0.0167
Iteration 40, loss = 0.0120
Iteration 60, loss = 0.0291
Iteration 80, loss = 0.0145
--- Epoch 401 / 100000
Iteration 0, loss = 0.0117
Iteration 20, loss = 0.0200
Iteration 40, loss = 0.0188
Iteration 60, loss = 0.0087
Iteration 80, loss = 0.0305
--- Epoch 402 / 100000
Iteration 0, loss = 0.0088
Iteration 20, loss = 0.0215
Iteration 40, loss = 0.0242
Iteration 60, loss = 0.0136
Iteration 80, loss = 0.0164
--- Epoch 403 / 100000
Iteration 0, loss = 0.0088
Iteration 20, loss = 0.0230
Iteration 40, loss = 0.0242
Iteration 60, loss = 0.0151
Iteration 80, loss = 0.0315
--- Epoch 404 / 100000
Iteration 0, loss = 0.0107
Iteration 20, loss = 0.0105
Iteration 40, loss = 0.0127
Iteration 60, loss = 0.0185
Iteration 80, loss = 0.0122
--- Epoch 405 / 100000
Iteration 0, loss = 0.0269
Iteration 20, loss = 0.0252
Iteration 40, loss = 0.0097
Iteration 60, loss = 0.0095
Iteration 80, loss = 0.0179
--- Epoch 406 / 100000
Iteration 0, loss = 0.0161
Iteration 20, loss = 0.0418
Iteration 40, loss = 0.0218
Iteration 60, loss = 0.0163
Iteration 80, loss = 0.0153
--- Epoch 407 / 100000
Iteration 0, loss = 0.0161
Iteration 20, loss = 0.0165
Iteration 40, loss = 0.0298
Iteration 60, loss = 0.0225
Iteration 80, loss = 0.0206
--- Epoch 408 / 100000
Iteration 0, loss = 0.0160
Iteration 20, loss = 0.0089
Iteration 40, loss = 0.0214
Iteration 60, loss = 0.0237
Iteration 80, loss = 0.0137
--- Epoch 409 / 100000
Iteration 0, loss = 0.0163
Iteration 20, loss = 0.0401
Iteration 40, loss = 0.0120
Iteration 60, loss = 0.0140
Iteration 80, loss = 0.0118
--- Epoch 410 / 100000
Iteration 0, loss = 0.0165
Iteration 20, loss = 0.0385
Iteration 40, loss = 0.0127
Iteration 60, loss = 0.0073
Iteration 80, loss = 0.0164
--- Epoch 411 / 100000
Iteration 0, loss = 0.0293
Iteration 20, loss = 0.0213
Iteration 40, loss = 0.0363
Iteration 60, loss = 0.0120
Iteration 80, loss = 0.0143
--- Epoch 412 / 100000
Iteration 0, loss = 0.0225
Iteration 20, loss = 0.0174
Iteration 40, loss = 0.0160
Iteration 60, loss = 0.0177
Iteration 80, loss = 0.0118
--- Epoch 413 / 100000
Iteration 0, loss = 0.0401
Iteration 20, loss = 0.0250
Iteration 40, loss = 0.0173
Iteration 60, loss = 0.0154
Iteration 80, loss = 0.0183
--- Epoch 414 / 100000
Iteration 0, loss = 0.0102
Iteration 20, loss = 0.0176
Iteration 40, loss = 0.0163
Iteration 60, loss = 0.0150
Iteration 80, loss = 0.0103
--- Epoch 415 / 100000
Iteration 0, loss = 0.0212
Iteration 20, loss = 0.0343
Iteration 40, loss = 0.0149
Iteration 60, loss = 0.0183
Iteration 80, loss = 0.0162
--- Epoch 416 / 100000
Iteration 0, loss = 0.0136
Iteration 20, loss = 0.0156
Iteration 40, loss = 0.0115
Iteration 60, loss = 0.0134
Iteration 80, loss = 0.0094
--- Epoch 417 / 100000
Iteration 0, loss = 0.0154
Iteration 20, loss = 0.0153
Iteration 40, loss = 0.0150
Iteration 60, loss = 0.0081
Iteration 80, loss = 0.0117
--- Epoch 418 / 100000
Iteration 0, loss = 0.0136
Iteration 20, loss = 0.0190
Iteration 40, loss = 0.0185
Iteration 60, loss = 0.0193
Iteration 80, loss = 0.0423
--- Epoch 419 / 100000
Iteration 0, loss = 0.0129
Iteration 20, loss = 0.0126
Iteration 40, loss = 0.0161
Iteration 60, loss = 0.0350
Iteration 80, loss = 0.0222
--- Epoch 420 / 100000
Iteration 0, loss = 0.0192
Iteration 20, loss = 0.0157
Iteration 40, loss = 0.0155
Iteration 60, loss = 0.0293
Iteration 80, loss = 0.0338
--- Epoch 421 / 100000
Iteration 0, loss = 0.0224
Iteration 20, loss = 0.0416
Iteration 40, loss = 0.0184
Iteration 60, loss = 0.0193
Iteration 80, loss = 0.0551
--- Epoch 422 / 100000
Iteration 0, loss = 0.0126
Iteration 20, loss = 0.0160
Iteration 40, loss = 0.0108
Iteration 60, loss = 0.0333
Iteration 80, loss = 0.0333
--- Epoch 423 / 100000
Iteration 0, loss = 0.0147
Iteration 20, loss = 0.0236
Iteration 40, loss = 0.0154
Iteration 60, loss = 0.0169
Iteration 80, loss = 0.0137
--- Epoch 424 / 100000
Iteration 0, loss = 0.0112
Iteration 20, loss = 0.0139
Iteration 40, loss = 0.0253
Iteration 60, loss = 0.0187
Iteration 80, loss = 0.0219
--- Epoch 425 / 100000
Iteration 0, loss = 0.0129
Iteration 20, loss = 0.0491
Iteration 40, loss = 0.0204
Iteration 60, loss = 0.0168
Iteration 80, loss = 0.0156
--- Epoch 426 / 100000
Iteration 0, loss = 0.0202
Iteration 20, loss = 0.0567
Iteration 40, loss = 0.0122
Iteration 60, loss = 0.0153
Iteration 80, loss = 0.0102
--- Epoch 427 / 100000
Iteration 0, loss = 0.0240
Iteration 20, loss = 0.0322
Iteration 40, loss = 0.0495
Iteration 60, loss = 0.0305
Iteration 80, loss = 0.0118
--- Epoch 428 / 100000
Iteration 0, loss = 0.0141
Iteration 20, loss = 0.0090
Iteration 40, loss = 0.0204
Iteration 60, loss = 0.0078
Iteration 80, loss = 0.0138
--- Epoch 429 / 100000
Iteration 0, loss = 0.0120
Iteration 20, loss = 0.0160
Iteration 40, loss = 0.0237
Iteration 60, loss = 0.0146
Iteration 80, loss = 0.0098
--- Epoch 430 / 100000
Iteration 0, loss = 0.0135
Iteration 20, loss = 0.0142
Iteration 40, loss = 0.0219
Iteration 60, loss = 0.0129
Iteration 80, loss = 0.0083
--- Epoch 431 / 100000
Iteration 0, loss = 0.0186
Iteration 20, loss = 0.0258
Iteration 40, loss = 0.0127
Iteration 60, loss = 0.0209
Iteration 80, loss = 0.0248
--- Epoch 432 / 100000
Iteration 0, loss = 0.0209
Iteration 20, loss = 0.0305
Iteration 40, loss = 0.0112
Iteration 60, loss = 0.0188
Iteration 80, loss = 0.0102
--- Epoch 433 / 100000
Iteration 0, loss = 0.0129
Iteration 20, loss = 0.0157
Iteration 40, loss = 0.0215
Iteration 60, loss = 0.0175
Iteration 80, loss = 0.0255
--- Epoch 434 / 100000
Iteration 0, loss = 0.0122
Iteration 20, loss = 0.0240
Iteration 40, loss = 0.0157
Iteration 60, loss = 0.0209
Iteration 80, loss = 0.0151
--- Epoch 435 / 100000
Iteration 0, loss = 0.0213
Iteration 20, loss = 0.0143
Iteration 40, loss = 0.0102
Iteration 60, loss = 0.0081
Iteration 80, loss = 0.0205
--- Epoch 436 / 100000
Iteration 0, loss = 0.0255
Iteration 20, loss = 0.0184
Iteration 40, loss = 0.0107
Iteration 60, loss = 0.0196
Iteration 80, loss = 0.0290
--- Epoch 437 / 100000
Iteration 0, loss = 0.0083
Iteration 20, loss = 0.0142
Iteration 40, loss = 0.0156
Iteration 60, loss = 0.0109
Iteration 80, loss = 0.0097
--- Epoch 438 / 100000
Iteration 0, loss = 0.0168
Iteration 20, loss = 0.0167
Iteration 40, loss = 0.0198
Iteration 60, loss = 0.0320
Iteration 80, loss = 0.0286
--- Epoch 439 / 100000
Iteration 0, loss = 0.0088
Iteration 20, loss = 0.0263
Iteration 40, loss = 0.0078
Iteration 60, loss = 0.0088
Iteration 80, loss = 0.0160
--- Epoch 440 / 100000
Iteration 0, loss = 0.0086
Iteration 20, loss = 0.0277
Iteration 40, loss = 0.0111
Iteration 60, loss = 0.0140
Iteration 80, loss = 0.0312
--- Epoch 441 / 100000
Iteration 0, loss = 0.0164
Iteration 20, loss = 0.0183
Iteration 40, loss = 0.0161
Iteration 60, loss = 0.0178
Iteration 80, loss = 0.0232
--- Epoch 442 / 100000
Iteration 0, loss = 0.0209
Iteration 20, loss = 0.0226
Iteration 40, loss = 0.0171
Iteration 60, loss = 0.0367
Iteration 80, loss = 0.0121
--- Epoch 443 / 100000
Iteration 0, loss = 0.0173
Iteration 20, loss = 0.0141
Iteration 40, loss = 0.0180
Iteration 60, loss = 0.0107
Iteration 80, loss = 0.0252
--- Epoch 444 / 100000
Iteration 0, loss = 0.0169
Iteration 20, loss = 0.0111
Iteration 40, loss = 0.0177
Iteration 60, loss = 0.0256
Iteration 80, loss = 0.0089
--- Epoch 445 / 100000
Iteration 0, loss = 0.0130
Iteration 20, loss = 0.0182
Iteration 40, loss = 0.0125
Iteration 60, loss = 0.0144
Iteration 80, loss = 0.0206
--- Epoch 446 / 100000
Iteration 0, loss = 0.0144
Iteration 20, loss = 0.0130
Iteration 40, loss = 0.0132
Iteration 60, loss = 0.0235
Iteration 80, loss = 0.0122
--- Epoch 447 / 100000
Iteration 0, loss = 0.0138
Iteration 20, loss = 0.0152
Iteration 40, loss = 0.0683
Iteration 60, loss = 0.0110
Iteration 80, loss = 0.0289
--- Epoch 448 / 100000
Iteration 0, loss = 0.0143
Iteration 20, loss = 0.0088
Iteration 40, loss = 0.0112
Iteration 60, loss = 0.0248
Iteration 80, loss = 0.0295
--- Epoch 449 / 100000
Iteration 0, loss = 0.0107
Iteration 20, loss = 0.0296
Iteration 40, loss = 0.0107
Iteration 60, loss = 0.0146
Iteration 80, loss = 0.0166
--- Epoch 450 / 100000
Iteration 0, loss = 0.0142
Iteration 20, loss = 0.0135
Iteration 40, loss = 0.0140
Iteration 60, loss = 0.0110
Iteration 80, loss = 0.0092
--- Epoch 451 / 100000
Iteration 0, loss = 0.0120
Iteration 20, loss = 0.0174
Iteration 40, loss = 0.0142
Iteration 60, loss = 0.0163
Iteration 80, loss = 0.0466
--- Epoch 452 / 100000
Iteration 0, loss = 0.0236
Iteration 20, loss = 0.0208
Iteration 40, loss = 0.0109
Iteration 60, loss = 0.0392
Iteration 80, loss = 0.0374
--- Epoch 453 / 100000
Iteration 0, loss = 0.0205
Iteration 20, loss = 0.0117
Iteration 40, loss = 0.0183
Iteration 60, loss = 0.0139
Iteration 80, loss = 0.0364
--- Epoch 454 / 100000
Iteration 0, loss = 0.0177
Iteration 20, loss = 0.0160
Iteration 40, loss = 0.0099
Iteration 60, loss = 0.0340
Iteration 80, loss = 0.0151
--- Epoch 455 / 100000
Iteration 0, loss = 0.0142
Iteration 20, loss = 0.0090
Iteration 40, loss = 0.0163
Iteration 60, loss = 0.0370
Iteration 80, loss = 0.0154
--- Epoch 456 / 100000
Iteration 0, loss = 0.0211
Iteration 20, loss = 0.0099
Iteration 40, loss = 0.0272
Iteration 60, loss = 0.0090
Iteration 80, loss = 0.0141
--- Epoch 457 / 100000
Iteration 0, loss = 0.0148
Iteration 20, loss = 0.0141
Iteration 40, loss = 0.0104
Iteration 60, loss = 0.0178
Iteration 80, loss = 0.0315
--- Epoch 458 / 100000
Iteration 0, loss = 0.0155
Iteration 20, loss = 0.0252
Iteration 40, loss = 0.0165
Iteration 60, loss = 0.0160
Iteration 80, loss = 0.0102
--- Epoch 459 / 100000
Iteration 0, loss = 0.0163
Iteration 20, loss = 0.0070
Iteration 40, loss = 0.0119
Iteration 60, loss = 0.0093
Iteration 80, loss = 0.0233
--- Epoch 460 / 100000
Iteration 0, loss = 0.0095
Iteration 20, loss = 0.0169
Iteration 40, loss = 0.0145
Iteration 60, loss = 0.0147
Iteration 80, loss = 0.0226
--- Epoch 461 / 100000
Iteration 0, loss = 0.0298
Iteration 20, loss = 0.0283
Iteration 40, loss = 0.0169
Iteration 60, loss = 0.0151
Iteration 80, loss = 0.0165
--- Epoch 462 / 100000
Iteration 0, loss = 0.0146
Iteration 20, loss = 0.0234
Iteration 40, loss = 0.0141
Iteration 60, loss = 0.0228
Iteration 80, loss = 0.0141
--- Epoch 463 / 100000
Iteration 0, loss = 0.0171
Iteration 20, loss = 0.0115
Iteration 40, loss = 0.0212
Iteration 60, loss = 0.0122
Iteration 80, loss = 0.0239
--- Epoch 464 / 100000
Iteration 0, loss = 0.0142
Iteration 20, loss = 0.0142
Iteration 40, loss = 0.0122
Iteration 60, loss = 0.0117
Iteration 80, loss = 0.0099
--- Epoch 465 / 100000
Iteration 0, loss = 0.0132
Iteration 20, loss = 0.0223
Iteration 40, loss = 0.0093
Iteration 60, loss = 0.0164
Iteration 80, loss = 0.0221
--- Epoch 466 / 100000
Iteration 0, loss = 0.0223
Iteration 20, loss = 0.0119
Iteration 40, loss = 0.0164
Iteration 60, loss = 0.0123
Iteration 80, loss = 0.0260
--- Epoch 467 / 100000
Iteration 0, loss = 0.0125
Iteration 20, loss = 0.0184
Iteration 40, loss = 0.0100
Iteration 60, loss = 0.0165
Iteration 80, loss = 0.0112
--- Epoch 468 / 100000
Iteration 0, loss = 0.0300
Iteration 20, loss = 0.0125
Iteration 40, loss = 0.0126
Iteration 60, loss = 0.0227
Iteration 80, loss = 0.0168
--- Epoch 469 / 100000
Iteration 0, loss = 0.0124
Iteration 20, loss = 0.0144
Iteration 40, loss = 0.0179
Iteration 60, loss = 0.0162
Iteration 80, loss = 0.0116
--- Epoch 470 / 100000
Iteration 0, loss = 0.0193
Iteration 20, loss = 0.0120
Iteration 40, loss = 0.0270
Iteration 60, loss = 0.0225
Iteration 80, loss = 0.0073
--- Epoch 471 / 100000
Iteration 0, loss = 0.0150
Iteration 20, loss = 0.0113
Iteration 40, loss = 0.0145
Iteration 60, loss = 0.0119
Iteration 80, loss = 0.0138
--- Epoch 472 / 100000
Iteration 0, loss = 0.0142
Iteration 20, loss = 0.0113
Iteration 40, loss = 0.0158
Iteration 60, loss = 0.0107
Iteration 80, loss = 0.0189
--- Epoch 473 / 100000
Iteration 0, loss = 0.0198
Iteration 20, loss = 0.0256
Iteration 40, loss = 0.0198
Iteration 60, loss = 0.0171
Iteration 80, loss = 0.0167
--- Epoch 474 / 100000
Iteration 0, loss = 0.0114
Iteration 20, loss = 0.0143
Iteration 40, loss = 0.0302
Iteration 60, loss = 0.0112
Iteration 80, loss = 0.0090
--- Epoch 475 / 100000
Iteration 0, loss = 0.0131
Iteration 20, loss = 0.0107
Iteration 40, loss = 0.0269
Iteration 60, loss = 0.0203
Iteration 80, loss = 0.0296
--- Epoch 476 / 100000
Iteration 0, loss = 0.0193
Iteration 20, loss = 0.0174
Iteration 40, loss = 0.0235
Iteration 60, loss = 0.0141
Iteration 80, loss = 0.0119
--- Epoch 477 / 100000
Iteration 0, loss = 0.0181
Iteration 20, loss = 0.0162
Iteration 40, loss = 0.0149
Iteration 60, loss = 0.0147
Iteration 80, loss = 0.0138
--- Epoch 478 / 100000
Iteration 0, loss = 0.0240
Iteration 20, loss = 0.0149
Iteration 40, loss = 0.0138
Iteration 60, loss = 0.0180
Iteration 80, loss = 0.0255
--- Epoch 479 / 100000
Iteration 0, loss = 0.0103
Iteration 20, loss = 0.0138
Iteration 40, loss = 0.0157
Iteration 60, loss = 0.0130
Iteration 80, loss = 0.0184
--- Epoch 480 / 100000
Iteration 0, loss = 0.0378
Iteration 20, loss = 0.0130
Iteration 40, loss = 0.0187
Iteration 60, loss = 0.0099
Iteration 80, loss = 0.0140
--- Epoch 481 / 100000
Iteration 0, loss = 0.0118
Iteration 20, loss = 0.0265
Iteration 40, loss = 0.0238
Iteration 60, loss = 0.0151
Iteration 80, loss = 0.0229
--- Epoch 482 / 100000
Iteration 0, loss = 0.0140
Iteration 20, loss = 0.0198
Iteration 40, loss = 0.0273
Iteration 60, loss = 0.0189
Iteration 80, loss = 0.0219
--- Epoch 483 / 100000
Iteration 0, loss = 0.0140
Iteration 20, loss = 0.0109
Iteration 40, loss = 0.0156
Iteration 60, loss = 0.0228
Iteration 80, loss = 0.0102
--- Epoch 484 / 100000
Iteration 0, loss = 0.0088
Iteration 20, loss = 0.0135
Iteration 40, loss = 0.0138
Iteration 60, loss = 0.0181
Iteration 80, loss = 0.0344
--- Epoch 485 / 100000
Iteration 0, loss = 0.0118
Iteration 20, loss = 0.0154
Iteration 40, loss = 0.0240
Iteration 60, loss = 0.0281
Iteration 80, loss = 0.0184
--- Epoch 486 / 100000
Iteration 0, loss = 0.0145
Iteration 20, loss = 0.0176
Iteration 40, loss = 0.0149
Iteration 60, loss = 0.0278
Iteration 80, loss = 0.0152
--- Epoch 487 / 100000
Iteration 0, loss = 0.0166
Iteration 20, loss = 0.0142
Iteration 40, loss = 0.0144
Iteration 60, loss = 0.0159
Iteration 80, loss = 0.0219
--- Epoch 488 / 100000
Iteration 0, loss = 0.0193
Iteration 20, loss = 0.0452
Iteration 40, loss = 0.0147
Iteration 60, loss = 0.0157
Iteration 80, loss = 0.0186
--- Epoch 489 / 100000
Iteration 0, loss = 0.0106
Iteration 20, loss = 0.0208
Iteration 40, loss = 0.0151
Iteration 60, loss = 0.0156
Iteration 80, loss = 0.0140
--- Epoch 490 / 100000
Iteration 0, loss = 0.0155
Iteration 20, loss = 0.0292
Iteration 40, loss = 0.0241
Iteration 60, loss = 0.0107
Iteration 80, loss = 0.0104
--- Epoch 491 / 100000
Iteration 0, loss = 0.0150
Iteration 20, loss = 0.0151
Iteration 40, loss = 0.0102
Iteration 60, loss = 0.0315
Iteration 80, loss = 0.0228
--- Epoch 492 / 100000
Iteration 0, loss = 0.0165
Iteration 20, loss = 0.0139
Iteration 40, loss = 0.0125
Iteration 60, loss = 0.0146
Iteration 80, loss = 0.0168
--- Epoch 493 / 100000
Iteration 0, loss = 0.0142
Iteration 20, loss = 0.0403
Iteration 40, loss = 0.0112
Iteration 60, loss = 0.0174
Iteration 80, loss = 0.0131
--- Epoch 494 / 100000
Iteration 0, loss = 0.0318
Iteration 20, loss = 0.0105
Iteration 40, loss = 0.0102
Iteration 60, loss = 0.0250
Iteration 80, loss = 0.0122
--- Epoch 495 / 100000
Iteration 0, loss = 0.0144
Iteration 20, loss = 0.0094
Iteration 40, loss = 0.0246
Iteration 60, loss = 0.0095
Iteration 80, loss = 0.0272
--- Epoch 496 / 100000
Iteration 0, loss = 0.0237
Iteration 20, loss = 0.0136
Iteration 40, loss = 0.0164
Iteration 60, loss = 0.0210
Iteration 80, loss = 0.0198
--- Epoch 497 / 100000
Iteration 0, loss = 0.0164
Iteration 20, loss = 0.0137
Iteration 40, loss = 0.0200
Iteration 60, loss = 0.0153
Iteration 80, loss = 0.0397
--- Epoch 498 / 100000
Iteration 0, loss = 0.0227
Iteration 20, loss = 0.0135
Iteration 40, loss = 0.0097
Iteration 60, loss = 0.0182
Iteration 80, loss = 0.0153
--- Epoch 499 / 100000
Iteration 0, loss = 0.0196
Iteration 20, loss = 0.0161
Iteration 40, loss = 0.0181
Iteration 60, loss = 0.0184
Iteration 80, loss = 0.0283
--- Epoch 500 / 100000
Iteration 0, loss = 0.0173
Iteration 20, loss = 0.0285
Iteration 40, loss = 0.0156
Iteration 60, loss = 0.0172
Iteration 80, loss = 0.0166
--- Epoch 501 / 100000
Iteration 0, loss = 0.0139
Iteration 20, loss = 0.0196
Iteration 40, loss = 0.0135
Iteration 60, loss = 0.0169
Iteration 80, loss = 0.0102
--- Epoch 502 / 100000
Iteration 0, loss = 0.0172
Iteration 20, loss = 0.0169
Iteration 40, loss = 0.0143
Iteration 60, loss = 0.0147
Iteration 80, loss = 0.0506
--- Epoch 503 / 100000
Iteration 0, loss = 0.0139
Iteration 20, loss = 0.0272
Iteration 40, loss = 0.0237
Iteration 60, loss = 0.0103
Iteration 80, loss = 0.0079
--- Epoch 504 / 100000
Iteration 0, loss = 0.0388
Iteration 20, loss = 0.0091
Iteration 40, loss = 0.0154
Iteration 60, loss = 0.0137
Iteration 80, loss = 0.0264
--- Epoch 505 / 100000
Iteration 0, loss = 0.0171
Iteration 20, loss = 0.0265
Iteration 40, loss = 0.0100
Iteration 60, loss = 0.0169
Iteration 80, loss = 0.0155
--- Epoch 506 / 100000
Iteration 0, loss = 0.0268
Iteration 20, loss = 0.0076
Iteration 40, loss = 0.0128
Iteration 60, loss = 0.0104
Iteration 80, loss = 0.0220
--- Epoch 507 / 100000
Iteration 0, loss = 0.0131
Iteration 20, loss = 0.0129
Iteration 40, loss = 0.0188
Iteration 60, loss = 0.0200
Iteration 80, loss = 0.0459
--- Epoch 508 / 100000
Iteration 0, loss = 0.0207
Iteration 20, loss = 0.0171
Iteration 40, loss = 0.0100
Iteration 60, loss = 0.0093
Iteration 80, loss = 0.0163
--- Epoch 509 / 100000
Iteration 0, loss = 0.0340
Iteration 20, loss = 0.0196
Iteration 40, loss = 0.0203
Iteration 60, loss = 0.0215
Iteration 80, loss = 0.0229
--- Epoch 510 / 100000
Iteration 0, loss = 0.0132
Iteration 20, loss = 0.0122
Iteration 40, loss = 0.0139
Iteration 60, loss = 0.0165
Iteration 80, loss = 0.0223
--- Epoch 511 / 100000
Iteration 0, loss = 0.0473
Iteration 20, loss = 0.0231
Iteration 40, loss = 0.0227
Iteration 60, loss = 0.0334
Iteration 80, loss = 0.0215
--- Epoch 512 / 100000
Iteration 0, loss = 0.0200
Iteration 20, loss = 0.0149
Iteration 40, loss = 0.0158
Iteration 60, loss = 0.0189
Iteration 80, loss = 0.0278
--- Epoch 513 / 100000
Iteration 0, loss = 0.0143
Iteration 20, loss = 0.0093
Iteration 40, loss = 0.0282
Iteration 60, loss = 0.0073
Iteration 80, loss = 0.0178
--- Epoch 514 / 100000
Iteration 0, loss = 0.0129
Iteration 20, loss = 0.0243
Iteration 40, loss = 0.0345
Iteration 60, loss = 0.0102
Iteration 80, loss = 0.0137
--- Epoch 515 / 100000
Iteration 0, loss = 0.0196
Iteration 20, loss = 0.0089
Iteration 40, loss = 0.0154
Iteration 60, loss = 0.0275
Iteration 80, loss = 0.0142
--- Epoch 516 / 100000
Iteration 0, loss = 0.0115
Iteration 20, loss = 0.0236
Iteration 40, loss = 0.0245
Iteration 60, loss = 0.0229
Iteration 80, loss = 0.0159
--- Epoch 517 / 100000
Iteration 0, loss = 0.0164
Iteration 20, loss = 0.0178
Iteration 40, loss = 0.0097
Iteration 60, loss = 0.0253
Iteration 80, loss = 0.0140
--- Epoch 518 / 100000
Iteration 0, loss = 0.0093
Iteration 20, loss = 0.0191
Iteration 40, loss = 0.0146
Iteration 60, loss = 0.0241
Iteration 80, loss = 0.0144
--- Epoch 519 / 100000
Iteration 0, loss = 0.0092
Iteration 20, loss = 0.0263
Iteration 40, loss = 0.0095
Iteration 60, loss = 0.0182
Iteration 80, loss = 0.0117
--- Epoch 520 / 100000
Iteration 0, loss = 0.0140
Iteration 20, loss = 0.0157
Iteration 40, loss = 0.0120
Iteration 60, loss = 0.0141
Iteration 80, loss = 0.0092
--- Epoch 521 / 100000
Iteration 0, loss = 0.0142
Iteration 20, loss = 0.0092
Iteration 40, loss = 0.0147
Iteration 60, loss = 0.0103
Iteration 80, loss = 0.0189
--- Epoch 522 / 100000
Iteration 0, loss = 0.0152
Iteration 20, loss = 0.0142
Iteration 40, loss = 0.0096
Iteration 60, loss = 0.0130
Iteration 80, loss = 0.0188
--- Epoch 523 / 100000
Iteration 0, loss = 0.0145
Iteration 20, loss = 0.0153
Iteration 40, loss = 0.0222
Iteration 60, loss = 0.0107
Iteration 80, loss = 0.0186
--- Epoch 524 / 100000
Iteration 0, loss = 0.0134
Iteration 20, loss = 0.0095
Iteration 40, loss = 0.0244
Iteration 60, loss = 0.0131
Iteration 80, loss = 0.0113
--- Epoch 525 / 100000
Iteration 0, loss = 0.0171
Iteration 20, loss = 0.0155
Iteration 40, loss = 0.0124
Iteration 60, loss = 0.0167
Iteration 80, loss = 0.0272
--- Epoch 526 / 100000
Iteration 0, loss = 0.0105
Iteration 20, loss = 0.0143
Iteration 40, loss = 0.0120
Iteration 60, loss = 0.0322
Iteration 80, loss = 0.0362
--- Epoch 527 / 100000
Iteration 0, loss = 0.0155
Iteration 20, loss = 0.0114
Iteration 40, loss = 0.0172
Iteration 60, loss = 0.0231
Iteration 80, loss = 0.0188
--- Epoch 528 / 100000
Iteration 0, loss = 0.0146
Iteration 20, loss = 0.0202
Iteration 40, loss = 0.0121
Iteration 60, loss = 0.0189
Iteration 80, loss = 0.0338
--- Epoch 529 / 100000
Iteration 0, loss = 0.0113
Iteration 20, loss = 0.0379
Iteration 40, loss = 0.0075
Iteration 60, loss = 0.0247
Iteration 80, loss = 0.0111
--- Epoch 530 / 100000
Iteration 0, loss = 0.0117
Iteration 20, loss = 0.0160
Iteration 40, loss = 0.0160
Iteration 60, loss = 0.0073
Iteration 80, loss = 0.0151
--- Epoch 531 / 100000
Iteration 0, loss = 0.0202
Iteration 20, loss = 0.0100
Iteration 40, loss = 0.0145
Iteration 60, loss = 0.0215
Iteration 80, loss = 0.0171
--- Epoch 532 / 100000
Iteration 0, loss = 0.0138
Iteration 20, loss = 0.0249
Iteration 40, loss = 0.0303
Iteration 60, loss = 0.0396
Iteration 80, loss = 0.0184
--- Epoch 533 / 100000
Iteration 0, loss = 0.0140
Iteration 20, loss = 0.0110
Iteration 40, loss = 0.0147
Iteration 60, loss = 0.0175
Iteration 80, loss = 0.0088
--- Epoch 534 / 100000
Iteration 0, loss = 0.0159
Iteration 20, loss = 0.0191
Iteration 40, loss = 0.0136
Iteration 60, loss = 0.0130
Iteration 80, loss = 0.0146
--- Epoch 535 / 100000
Iteration 0, loss = 0.0133
Iteration 20, loss = 0.0152
Iteration 40, loss = 0.0321
Iteration 60, loss = 0.0162
Iteration 80, loss = 0.0336
--- Epoch 536 / 100000
Iteration 0, loss = 0.0104
Iteration 20, loss = 0.0261
Iteration 40, loss = 0.0128
Iteration 60, loss = 0.0133
Iteration 80, loss = 0.0194
--- Epoch 537 / 100000
Iteration 0, loss = 0.0260
Iteration 20, loss = 0.0475
Iteration 40, loss = 0.0117
Iteration 60, loss = 0.0110
Iteration 80, loss = 0.0169
--- Epoch 538 / 100000
Iteration 0, loss = 0.0135
Iteration 20, loss = 0.0097
Iteration 40, loss = 0.0117
Iteration 60, loss = 0.0246
Iteration 80, loss = 0.0264
--- Epoch 539 / 100000
Iteration 0, loss = 0.0169
Iteration 20, loss = 0.0312
Iteration 40, loss = 0.0182
Iteration 60, loss = 0.0247
Iteration 80, loss = 0.0132
--- Epoch 540 / 100000
Iteration 0, loss = 0.0218
Iteration 20, loss = 0.0134
Iteration 40, loss = 0.0244
Iteration 60, loss = 0.0175
Iteration 80, loss = 0.0159
--- Epoch 541 / 100000
Iteration 0, loss = 0.0081
Iteration 20, loss = 0.0211
Iteration 40, loss = 0.0148
Iteration 60, loss = 0.0190
Iteration 80, loss = 0.0075
--- Epoch 542 / 100000
Iteration 0, loss = 0.0140
Iteration 20, loss = 0.0147
Iteration 40, loss = 0.0077
Iteration 60, loss = 0.0171
Iteration 80, loss = 0.0106
--- Epoch 543 / 100000
Iteration 0, loss = 0.0143
Iteration 20, loss = 0.0143
Iteration 40, loss = 0.0185
Iteration 60, loss = 0.0181
Iteration 80, loss = 0.0119
--- Epoch 544 / 100000
Iteration 0, loss = 0.0112
Iteration 20, loss = 0.0105
Iteration 40, loss = 0.0128
Iteration 60, loss = 0.0149
Iteration 80, loss = 0.0301
--- Epoch 545 / 100000
Iteration 0, loss = 0.0180
Iteration 20, loss = 0.0299
Iteration 40, loss = 0.0226
Iteration 60, loss = 0.0097
Iteration 80, loss = 0.0071
--- Epoch 546 / 100000
Iteration 0, loss = 0.0170
Iteration 20, loss = 0.0211
Iteration 40, loss = 0.0139
Iteration 60, loss = 0.0103
Iteration 80, loss = 0.0121
--- Epoch 547 / 100000
Iteration 0, loss = 0.0146
Iteration 20, loss = 0.0283
Iteration 40, loss = 0.0137
Iteration 60, loss = 0.0231
Iteration 80, loss = 0.0141
--- Epoch 548 / 100000
Iteration 0, loss = 0.0076
Iteration 20, loss = 0.0371
Iteration 40, loss = 0.0189
Iteration 60, loss = 0.0106
Iteration 80, loss = 0.0246
--- Epoch 549 / 100000
Iteration 0, loss = 0.0094
Iteration 20, loss = 0.0130
Iteration 40, loss = 0.0107
Iteration 60, loss = 0.0200
Iteration 80, loss = 0.0109
--- Epoch 550 / 100000
Iteration 0, loss = 0.0141
Iteration 20, loss = 0.0210
Iteration 40, loss = 0.0284
Iteration 60, loss = 0.0192
Iteration 80, loss = 0.0207
--- Epoch 551 / 100000
Iteration 0, loss = 0.0163
Iteration 20, loss = 0.0080
Iteration 40, loss = 0.0166
Iteration 60, loss = 0.0146
Iteration 80, loss = 0.0109
--- Epoch 552 / 100000
Iteration 0, loss = 0.0089
Iteration 20, loss = 0.0166
Iteration 40, loss = 0.0135
Iteration 60, loss = 0.0154
Iteration 80, loss = 0.0099
--- Epoch 553 / 100000
Iteration 0, loss = 0.0195
Iteration 20, loss = 0.0190
Iteration 40, loss = 0.0325
Iteration 60, loss = 0.0307
Iteration 80, loss = 0.0207
--- Epoch 554 / 100000
Iteration 0, loss = 0.0141
Iteration 20, loss = 0.0202
Iteration 40, loss = 0.0106
Iteration 60, loss = 0.0198
Iteration 80, loss = 0.0140
--- Epoch 555 / 100000
Iteration 0, loss = 0.0208
Iteration 20, loss = 0.0122
Iteration 40, loss = 0.0182
Iteration 60, loss = 0.0199
Iteration 80, loss = 0.0107
--- Epoch 556 / 100000
Iteration 0, loss = 0.0132
Iteration 20, loss = 0.0213
Iteration 40, loss = 0.0277
Iteration 60, loss = 0.0078
Iteration 80, loss = 0.0141
--- Epoch 557 / 100000
Iteration 0, loss = 0.0157
Iteration 20, loss = 0.0075
Iteration 40, loss = 0.0144
Iteration 60, loss = 0.0189
Iteration 80, loss = 0.0174
--- Epoch 558 / 100000
Iteration 0, loss = 0.0140
Iteration 20, loss = 0.0130
Iteration 40, loss = 0.0181
Iteration 60, loss = 0.0138
Iteration 80, loss = 0.0182
--- Epoch 559 / 100000
Iteration 0, loss = 0.0119
Iteration 20, loss = 0.0103
Iteration 40, loss = 0.0126
Iteration 60, loss = 0.0116
Iteration 80, loss = 0.0151
--- Epoch 560 / 100000
Iteration 0, loss = 0.0233
Iteration 20, loss = 0.0196
Iteration 40, loss = 0.0181
Iteration 60, loss = 0.0134
Iteration 80, loss = 0.0156
--- Epoch 561 / 100000
Iteration 0, loss = 0.0118
Iteration 20, loss = 0.0172
Iteration 40, loss = 0.0217
Iteration 60, loss = 0.0399
Iteration 80, loss = 0.0123
--- Epoch 562 / 100000
Iteration 0, loss = 0.0166
Iteration 20, loss = 0.0230
Iteration 40, loss = 0.0287
Iteration 60, loss = 0.0078
Iteration 80, loss = 0.0454
--- Epoch 563 / 100000
Iteration 0, loss = 0.0147
Iteration 20, loss = 0.0156
Iteration 40, loss = 0.0156
Iteration 60, loss = 0.0107
Iteration 80, loss = 0.0136
--- Epoch 564 / 100000
Iteration 0, loss = 0.0145
Iteration 20, loss = 0.0162
Iteration 40, loss = 0.0121
Iteration 60, loss = 0.0050
Iteration 80, loss = 0.0289
--- Epoch 565 / 100000
Iteration 0, loss = 0.0116
Iteration 20, loss = 0.0165
Iteration 40, loss = 0.0103
Iteration 60, loss = 0.0165
Iteration 80, loss = 0.0263
--- Epoch 566 / 100000
Iteration 0, loss = 0.0368
Iteration 20, loss = 0.0092
Iteration 40, loss = 0.0122
Iteration 60, loss = 0.0098
Iteration 80, loss = 0.0080
--- Epoch 567 / 100000
Iteration 0, loss = 0.0160
Iteration 20, loss = 0.0138
Iteration 40, loss = 0.0217
Iteration 60, loss = 0.0126
Iteration 80, loss = 0.0394
--- Epoch 568 / 100000
Iteration 0, loss = 0.0131
Iteration 20, loss = 0.0250
Iteration 40, loss = 0.0200
Iteration 60, loss = 0.0197
Iteration 80, loss = 0.0076
--- Epoch 569 / 100000
Iteration 0, loss = 0.0155
Iteration 20, loss = 0.0160
Iteration 40, loss = 0.0182
Iteration 60, loss = 0.0113
Iteration 80, loss = 0.0118
--- Epoch 570 / 100000
Iteration 0, loss = 0.0190
Iteration 20, loss = 0.0097
Iteration 40, loss = 0.0170
Iteration 60, loss = 0.0196
Iteration 80, loss = 0.0079
--- Epoch 571 / 100000
Iteration 0, loss = 0.0202
Iteration 20, loss = 0.0095
Iteration 40, loss = 0.0319
Iteration 60, loss = 0.0091
Iteration 80, loss = 0.0192
--- Epoch 572 / 100000
Iteration 0, loss = 0.0102
Iteration 20, loss = 0.0096
Iteration 40, loss = 0.0183
Iteration 60, loss = 0.0071
Iteration 80, loss = 0.0089
--- Epoch 573 / 100000
Iteration 0, loss = 0.0232
Iteration 20, loss = 0.0245
Iteration 40, loss = 0.0126
Iteration 60, loss = 0.0130
Iteration 80, loss = 0.0161
--- Epoch 574 / 100000
Iteration 0, loss = 0.0235
Iteration 20, loss = 0.0082
Iteration 40, loss = 0.0331
Iteration 60, loss = 0.0160
Iteration 80, loss = 0.0272
--- Epoch 575 / 100000
Iteration 0, loss = 0.0201
Iteration 20, loss = 0.0138
Iteration 40, loss = 0.0117
Iteration 60, loss = 0.0152
Iteration 80, loss = 0.0118
--- Epoch 576 / 100000
Iteration 0, loss = 0.0180
Iteration 20, loss = 0.0475
Iteration 40, loss = 0.0267
Iteration 60, loss = 0.0131
Iteration 80, loss = 0.0261
--- Epoch 577 / 100000
Iteration 0, loss = 0.0202
Iteration 20, loss = 0.0160
Iteration 40, loss = 0.0105
Iteration 60, loss = 0.0110
Iteration 80, loss = 0.0120
--- Epoch 578 / 100000
Iteration 0, loss = 0.0123
Iteration 20, loss = 0.0256
Iteration 40, loss = 0.0092
Iteration 60, loss = 0.0202
Iteration 80, loss = 0.0170
--- Epoch 579 / 100000
Iteration 0, loss = 0.0222
Iteration 20, loss = 0.0192
Iteration 40, loss = 0.0112
Iteration 60, loss = 0.0384
Iteration 80, loss = 0.0200
--- Epoch 580 / 100000
Iteration 0, loss = 0.0152
Iteration 20, loss = 0.0141
Iteration 40, loss = 0.0120
Iteration 60, loss = 0.0148
Iteration 80, loss = 0.0187
--- Epoch 581 / 100000
Iteration 0, loss = 0.0112
Iteration 20, loss = 0.0085
Iteration 40, loss = 0.0195
Iteration 60, loss = 0.0228
Iteration 80, loss = 0.0111
--- Epoch 582 / 100000
Iteration 0, loss = 0.0146
Iteration 20, loss = 0.0110
Iteration 40, loss = 0.0148
Iteration 60, loss = 0.0206
Iteration 80, loss = 0.0131
--- Epoch 583 / 100000
Iteration 0, loss = 0.0138
Iteration 20, loss = 0.0173
Iteration 40, loss = 0.0185
Iteration 60, loss = 0.0113
Iteration 80, loss = 0.0209
--- Epoch 584 / 100000
Iteration 0, loss = 0.0290
Iteration 20, loss = 0.0124
Iteration 40, loss = 0.0208
Iteration 60, loss = 0.0126
Iteration 80, loss = 0.0183
--- Epoch 585 / 100000
Iteration 0, loss = 0.0205
Iteration 20, loss = 0.0117
Iteration 40, loss = 0.0139
Iteration 60, loss = 0.0275
Iteration 80, loss = 0.0269
--- Epoch 586 / 100000
Iteration 0, loss = 0.0132
Iteration 20, loss = 0.0402
Iteration 40, loss = 0.0198
Iteration 60, loss = 0.0130
Iteration 80, loss = 0.0093
--- Epoch 587 / 100000
Iteration 0, loss = 0.0165
Iteration 20, loss = 0.0121
Iteration 40, loss = 0.0145
Iteration 60, loss = 0.0091
Iteration 80, loss = 0.0220
--- Epoch 588 / 100000
Iteration 0, loss = 0.0143
Iteration 20, loss = 0.0200
Iteration 40, loss = 0.0080
Iteration 60, loss = 0.0150
Iteration 80, loss = 0.0109
--- Epoch 589 / 100000
Iteration 0, loss = 0.0149
Iteration 20, loss = 0.0140
Iteration 40, loss = 0.0350
Iteration 60, loss = 0.0150
Iteration 80, loss = 0.0262
--- Epoch 590 / 100000
Iteration 0, loss = 0.0117
Iteration 20, loss = 0.0149
Iteration 40, loss = 0.0264
Iteration 60, loss = 0.0241
Iteration 80, loss = 0.0072
--- Epoch 591 / 100000
Iteration 0, loss = 0.0119
Iteration 20, loss = 0.0089
Iteration 40, loss = 0.0124
Iteration 60, loss = 0.0181
Iteration 80, loss = 0.0141
--- Epoch 592 / 100000
Iteration 0, loss = 0.0103
Iteration 20, loss = 0.0102
Iteration 40, loss = 0.0112
Iteration 60, loss = 0.0092
Iteration 80, loss = 0.0156
--- Epoch 593 / 100000
Iteration 0, loss = 0.0162
Iteration 20, loss = 0.0166
Iteration 40, loss = 0.0169
Iteration 60, loss = 0.0218
Iteration 80, loss = 0.0096
--- Epoch 594 / 100000
Iteration 0, loss = 0.0146
Iteration 20, loss = 0.0232
Iteration 40, loss = 0.0188
Iteration 60, loss = 0.0119
Iteration 80, loss = 0.0148
--- Epoch 595 / 100000
Iteration 0, loss = 0.0108
Iteration 20, loss = 0.0176
Iteration 40, loss = 0.0149
Iteration 60, loss = 0.0178
Iteration 80, loss = 0.0093
--- Epoch 596 / 100000
Iteration 0, loss = 0.0215
Iteration 20, loss = 0.0207
Iteration 40, loss = 0.0137
Iteration 60, loss = 0.0177
Iteration 80, loss = 0.0252
--- Epoch 597 / 100000
Iteration 0, loss = 0.0161
Iteration 20, loss = 0.0447
Iteration 40, loss = 0.0163
Iteration 60, loss = 0.0169
Iteration 80, loss = 0.0214
--- Epoch 598 / 100000
Iteration 0, loss = 0.0257
Iteration 20, loss = 0.0107
Iteration 40, loss = 0.0170
Iteration 60, loss = 0.0102
Iteration 80, loss = 0.0096
--- Epoch 599 / 100000
Iteration 0, loss = 0.0149
Iteration 20, loss = 0.0121
Iteration 40, loss = 0.0113
Iteration 60, loss = 0.0190
Iteration 80, loss = 0.0212
--- Epoch 600 / 100000
Iteration 0, loss = 0.0137
Iteration 20, loss = 0.0286
Iteration 40, loss = 0.0294
Iteration 60, loss = 0.0140
Iteration 80, loss = 0.0211
--- Epoch 601 / 100000
Iteration 0, loss = 0.0088
Iteration 20, loss = 0.0259
Iteration 40, loss = 0.0115
Iteration 60, loss = 0.0177
Iteration 80, loss = 0.0204
--- Epoch 602 / 100000
Iteration 0, loss = 0.0156
Iteration 20, loss = 0.0130
Iteration 40, loss = 0.0162
Iteration 60, loss = 0.0084
Iteration 80, loss = 0.0209
--- Epoch 603 / 100000
Iteration 0, loss = 0.0092
Iteration 20, loss = 0.0187
Iteration 40, loss = 0.0117
Iteration 60, loss = 0.0191
Iteration 80, loss = 0.0097
--- Epoch 604 / 100000
Iteration 0, loss = 0.0166
Iteration 20, loss = 0.0207
Iteration 40, loss = 0.0287
Iteration 60, loss = 0.0104
Iteration 80, loss = 0.0137
--- Epoch 605 / 100000
Iteration 0, loss = 0.0119
Iteration 20, loss = 0.0140
Iteration 40, loss = 0.0132
Iteration 60, loss = 0.0189
Iteration 80, loss = 0.0085
--- Epoch 606 / 100000
Iteration 0, loss = 0.0144
Iteration 20, loss = 0.0154
Iteration 40, loss = 0.0139
Iteration 60, loss = 0.0135
Iteration 80, loss = 0.0192
--- Epoch 607 / 100000
Iteration 0, loss = 0.0114
Iteration 20, loss = 0.0101
Iteration 40, loss = 0.0099
Iteration 60, loss = 0.0290
Iteration 80, loss = 0.0200
--- Epoch 608 / 100000
Iteration 0, loss = 0.0138
Iteration 20, loss = 0.0177
Iteration 40, loss = 0.0116
Iteration 60, loss = 0.0097
Iteration 80, loss = 0.0108
--- Epoch 609 / 100000
Iteration 0, loss = 0.0099
Iteration 20, loss = 0.0215
Iteration 40, loss = 0.0266
Iteration 60, loss = 0.0206
Iteration 80, loss = 0.0112
--- Epoch 610 / 100000
Iteration 0, loss = 0.0655
Iteration 20, loss = 0.0145
Iteration 40, loss = 0.0157
Iteration 60, loss = 0.0192
Iteration 80, loss = 0.0088
--- Epoch 611 / 100000
Iteration 0, loss = 0.0383
Iteration 20, loss = 0.0351
Iteration 40, loss = 0.0173
Iteration 60, loss = 0.0073
Iteration 80, loss = 0.0160
--- Epoch 612 / 100000
Iteration 0, loss = 0.0168
Iteration 20, loss = 0.0151
Iteration 40, loss = 0.0118
Iteration 60, loss = 0.0103
Iteration 80, loss = 0.0119
--- Epoch 613 / 100000
Iteration 0, loss = 0.0179
Iteration 20, loss = 0.0243
Iteration 40, loss = 0.0155
Iteration 60, loss = 0.0187
Iteration 80, loss = 0.0166
--- Epoch 614 / 100000
Iteration 0, loss = 0.0101
Iteration 20, loss = 0.0073
Iteration 40, loss = 0.0100
Iteration 60, loss = 0.0215
Iteration 80, loss = 0.0118
--- Epoch 615 / 100000
Iteration 0, loss = 0.0087
Iteration 20, loss = 0.0086
Iteration 40, loss = 0.0267
Iteration 60, loss = 0.0077
Iteration 80, loss = 0.0121
--- Epoch 616 / 100000
Iteration 0, loss = 0.0135
Iteration 20, loss = 0.0166
Iteration 40, loss = 0.0195
Iteration 60, loss = 0.0210
Iteration 80, loss = 0.0180
--- Epoch 617 / 100000
Iteration 0, loss = 0.0276
Iteration 20, loss = 0.0178
Iteration 40, loss = 0.0100
Iteration 60, loss = 0.0143
Iteration 80, loss = 0.0121
--- Epoch 618 / 100000
Iteration 0, loss = 0.0182
Iteration 20, loss = 0.0125
Iteration 40, loss = 0.0223
Iteration 60, loss = 0.0152
Iteration 80, loss = 0.0182
--- Epoch 619 / 100000
Iteration 0, loss = 0.0207
Iteration 20, loss = 0.0126
Iteration 40, loss = 0.0120
Iteration 60, loss = 0.0079
Iteration 80, loss = 0.0225
--- Epoch 620 / 100000
Iteration 0, loss = 0.0151
Iteration 20, loss = 0.0113
Iteration 40, loss = 0.0094
Iteration 60, loss = 0.0473
Iteration 80, loss = 0.0171
--- Epoch 621 / 100000
Iteration 0, loss = 0.0139
Iteration 20, loss = 0.0121
Iteration 40, loss = 0.0071
Iteration 60, loss = 0.0122
Iteration 80, loss = 0.0148
--- Epoch 622 / 100000
Iteration 0, loss = 0.0250
Iteration 20, loss = 0.0333
Iteration 40, loss = 0.0175
Iteration 60, loss = 0.0216
Iteration 80, loss = 0.0229
--- Epoch 623 / 100000
Iteration 0, loss = 0.0182
Iteration 20, loss = 0.0171
Iteration 40, loss = 0.0154
Iteration 60, loss = 0.0111
Iteration 80, loss = 0.0131
--- Epoch 624 / 100000
Iteration 0, loss = 0.0147
Iteration 20, loss = 0.0475
Iteration 40, loss = 0.0222
Iteration 60, loss = 0.0131
Iteration 80, loss = 0.0141
--- Epoch 625 / 100000
Iteration 0, loss = 0.0322
Iteration 20, loss = 0.0131
Iteration 40, loss = 0.0087
Iteration 60, loss = 0.0065
Iteration 80, loss = 0.0143
--- Epoch 626 / 100000
Iteration 0, loss = 0.0273
Iteration 20, loss = 0.0187
Iteration 40, loss = 0.0069
Iteration 60, loss = 0.0103
Iteration 80, loss = 0.0152
--- Epoch 627 / 100000
Iteration 0, loss = 0.0089
Iteration 20, loss = 0.0090
Iteration 40, loss = 0.0181
Iteration 60, loss = 0.0315
Iteration 80, loss = 0.0144
--- Epoch 628 / 100000
Iteration 0, loss = 0.0176
Iteration 20, loss = 0.0277
Iteration 40, loss = 0.0129
Iteration 60, loss = 0.0083
Iteration 80, loss = 0.0089
--- Epoch 629 / 100000
Iteration 0, loss = 0.0254
Iteration 20, loss = 0.0110
Iteration 40, loss = 0.0434
Iteration 60, loss = 0.0195
Iteration 80, loss = 0.0172
--- Epoch 630 / 100000
Iteration 0, loss = 0.0163
Iteration 20, loss = 0.0175
Iteration 40, loss = 0.0448
Iteration 60, loss = 0.0313
Iteration 80, loss = 0.0222
--- Epoch 631 / 100000
Iteration 0, loss = 0.0200
Iteration 20, loss = 0.0227
Iteration 40, loss = 0.0128
Iteration 60, loss = 0.0298
Iteration 80, loss = 0.0129
--- Epoch 632 / 100000
Iteration 0, loss = 0.0201
Iteration 20, loss = 0.0245
Iteration 40, loss = 0.0143
Iteration 60, loss = 0.0268
Iteration 80, loss = 0.0098
--- Epoch 633 / 100000
Iteration 0, loss = 0.0089
Iteration 20, loss = 0.0111
Iteration 40, loss = 0.0194
Iteration 60, loss = 0.0274
Iteration 80, loss = 0.0185
--- Epoch 634 / 100000
Iteration 0, loss = 0.0080
Iteration 20, loss = 0.0113
Iteration 40, loss = 0.0425
Iteration 60, loss = 0.0092
Iteration 80, loss = 0.0107
--- Epoch 635 / 100000
Iteration 0, loss = 0.0167
Iteration 20, loss = 0.0104
Iteration 40, loss = 0.0204
Iteration 60, loss = 0.0154
Iteration 80, loss = 0.0093
--- Epoch 636 / 100000
Iteration 0, loss = 0.0190
Iteration 20, loss = 0.0083
Iteration 40, loss = 0.0088
Iteration 60, loss = 0.0133
Iteration 80, loss = 0.0099
--- Epoch 637 / 100000
Iteration 0, loss = 0.0114
Iteration 20, loss = 0.0161
Iteration 40, loss = 0.0104
Iteration 60, loss = 0.0132
Iteration 80, loss = 0.0217
--- Epoch 638 / 100000
Iteration 0, loss = 0.0157
Iteration 20, loss = 0.0120
Iteration 40, loss = 0.0104
Iteration 60, loss = 0.0126
Iteration 80, loss = 0.0114
--- Epoch 639 / 100000
Iteration 0, loss = 0.0110
Iteration 20, loss = 0.0090
Iteration 40, loss = 0.0164
Iteration 60, loss = 0.0229
Iteration 80, loss = 0.0731
--- Epoch 640 / 100000
Iteration 0, loss = 0.0197
Iteration 20, loss = 0.0077
Iteration 40, loss = 0.0149
Iteration 60, loss = 0.0113
Iteration 80, loss = 0.0167
--- Epoch 641 / 100000
Iteration 0, loss = 0.0124
Iteration 20, loss = 0.0171
Iteration 40, loss = 0.0105
Iteration 60, loss = 0.0154
Iteration 80, loss = 0.0167
--- Epoch 642 / 100000
Iteration 0, loss = 0.0102
Iteration 20, loss = 0.0125
Iteration 40, loss = 0.0131
Iteration 60, loss = 0.0117
Iteration 80, loss = 0.0104
--- Epoch 643 / 100000
Iteration 0, loss = 0.0297
Iteration 20, loss = 0.0198
Iteration 40, loss = 0.0171
Iteration 60, loss = 0.0130
Iteration 80, loss = 0.0170
--- Epoch 644 / 100000
Iteration 0, loss = 0.0144
Iteration 20, loss = 0.0256
Iteration 40, loss = 0.0328
Iteration 60, loss = 0.0227
Iteration 80, loss = 0.0145
--- Epoch 645 / 100000
Iteration 0, loss = 0.0258
Iteration 20, loss = 0.0129
Iteration 40, loss = 0.0141
Iteration 60, loss = 0.0381
Iteration 80, loss = 0.0244
--- Epoch 646 / 100000
Iteration 0, loss = 0.0106
Iteration 20, loss = 0.0145
Iteration 40, loss = 0.0190
Iteration 60, loss = 0.0115
Iteration 80, loss = 0.0249
--- Epoch 647 / 100000
Iteration 0, loss = 0.0161
Iteration 20, loss = 0.0103
Iteration 40, loss = 0.0180
Iteration 60, loss = 0.0114
Iteration 80, loss = 0.0101
--- Epoch 648 / 100000
Iteration 0, loss = 0.0206
Iteration 20, loss = 0.0176
Iteration 40, loss = 0.0171
Iteration 60, loss = 0.0120
Iteration 80, loss = 0.0114
--- Epoch 649 / 100000
Iteration 0, loss = 0.0181
Iteration 20, loss = 0.0118
Iteration 40, loss = 0.0161
Iteration 60, loss = 0.0258
Iteration 80, loss = 0.0181
--- Epoch 650 / 100000
Iteration 0, loss = 0.0202
Iteration 20, loss = 0.0163
Iteration 40, loss = 0.0300
Iteration 60, loss = 0.0478
Iteration 80, loss = 0.0100
--- Epoch 651 / 100000
Iteration 0, loss = 0.0116
Iteration 20, loss = 0.0118
Iteration 40, loss = 0.0194
Iteration 60, loss = 0.0141
Iteration 80, loss = 0.0082
--- Epoch 652 / 100000
Iteration 0, loss = 0.0144
Iteration 20, loss = 0.0119
Iteration 40, loss = 0.0048
Iteration 60, loss = 0.0252
Iteration 80, loss = 0.0164
--- Epoch 653 / 100000
Iteration 0, loss = 0.0157
Iteration 20, loss = 0.0128
Iteration 40, loss = 0.0188
Iteration 60, loss = 0.0134
Iteration 80, loss = 0.0331
--- Epoch 654 / 100000
Iteration 0, loss = 0.0224
Iteration 20, loss = 0.0205
Iteration 40, loss = 0.0150
Iteration 60, loss = 0.0158
Iteration 80, loss = 0.0141
--- Epoch 655 / 100000
Iteration 0, loss = 0.0202
Iteration 20, loss = 0.0093
Iteration 40, loss = 0.0220
Iteration 60, loss = 0.0104
Iteration 80, loss = 0.0539
--- Epoch 656 / 100000
Iteration 0, loss = 0.0124
Iteration 20, loss = 0.0152
Iteration 40, loss = 0.0085
Iteration 60, loss = 0.0127
Iteration 80, loss = 0.0116
--- Epoch 657 / 100000
Iteration 0, loss = 0.0368
Iteration 20, loss = 0.0091
Iteration 40, loss = 0.0202
Iteration 60, loss = 0.0104
Iteration 80, loss = 0.0159
--- Epoch 658 / 100000
Iteration 0, loss = 0.0198
Iteration 20, loss = 0.0151
Iteration 40, loss = 0.0079
Iteration 60, loss = 0.0090
Iteration 80, loss = 0.0149
--- Epoch 659 / 100000
Iteration 0, loss = 0.0113
Iteration 20, loss = 0.0357
Iteration 40, loss = 0.0096
Iteration 60, loss = 0.0238
Iteration 80, loss = 0.0167
--- Epoch 660 / 100000
Iteration 0, loss = 0.0145
Iteration 20, loss = 0.0269
Iteration 40, loss = 0.0095
Iteration 60, loss = 0.0192
Iteration 80, loss = 0.0145
--- Epoch 661 / 100000
Iteration 0, loss = 0.0200
Iteration 20, loss = 0.0086
Iteration 40, loss = 0.0247
Iteration 60, loss = 0.0107
Iteration 80, loss = 0.0115
--- Epoch 662 / 100000
Iteration 0, loss = 0.0120
Iteration 20, loss = 0.0134
Iteration 40, loss = 0.0086
Iteration 60, loss = 0.0209
Iteration 80, loss = 0.0208
--- Epoch 663 / 100000
Iteration 0, loss = 0.0183
Iteration 20, loss = 0.0118
Iteration 40, loss = 0.0149
Iteration 60, loss = 0.0162
Iteration 80, loss = 0.0141
--- Epoch 664 / 100000
Iteration 0, loss = 0.0110
Iteration 20, loss = 0.0093
Iteration 40, loss = 0.0300
Iteration 60, loss = 0.0192
Iteration 80, loss = 0.0147
--- Epoch 665 / 100000
Iteration 0, loss = 0.0272
Iteration 20, loss = 0.0121
Iteration 40, loss = 0.0117
Iteration 60, loss = 0.0307
Iteration 80, loss = 0.0146
--- Epoch 666 / 100000
Iteration 0, loss = 0.0132
Iteration 20, loss = 0.0152
Iteration 40, loss = 0.0101
Iteration 60, loss = 0.0112
Iteration 80, loss = 0.0116
--- Epoch 667 / 100000
Iteration 0, loss = 0.0099
Iteration 20, loss = 0.0111
Iteration 40, loss = 0.0309
Iteration 60, loss = 0.0124
Iteration 80, loss = 0.0225
--- Epoch 668 / 100000
Iteration 0, loss = 0.0209
Iteration 20, loss = 0.0177
Iteration 40, loss = 0.0149
Iteration 60, loss = 0.0108
Iteration 80, loss = 0.0464
--- Epoch 669 / 100000
Iteration 0, loss = 0.0293
Iteration 20, loss = 0.0340
Iteration 40, loss = 0.0175
Iteration 60, loss = 0.0205
Iteration 80, loss = 0.0121
--- Epoch 670 / 100000
Iteration 0, loss = 0.0095
Iteration 20, loss = 0.0152
Iteration 40, loss = 0.0091
Iteration 60, loss = 0.0256
Iteration 80, loss = 0.0099
--- Epoch 671 / 100000
Iteration 0, loss = 0.0244
Iteration 20, loss = 0.0224
Iteration 40, loss = 0.0117
Iteration 60, loss = 0.0731
Iteration 80, loss = 0.0110
--- Epoch 672 / 100000
Iteration 0, loss = 0.0129
Iteration 20, loss = 0.0200
Iteration 40, loss = 0.0133
Iteration 60, loss = 0.0075
Iteration 80, loss = 0.0126
--- Epoch 673 / 100000
Iteration 0, loss = 0.0195
Iteration 20, loss = 0.0219
Iteration 40, loss = 0.0070
Iteration 60, loss = 0.0236
Iteration 80, loss = 0.0091
--- Epoch 674 / 100000
Iteration 0, loss = 0.0122
Iteration 20, loss = 0.0153
Iteration 40, loss = 0.0167
Iteration 60, loss = 0.0106
Iteration 80, loss = 0.0162
--- Epoch 675 / 100000
Iteration 0, loss = 0.0103
Iteration 20, loss = 0.0079
Iteration 40, loss = 0.0162
Iteration 60, loss = 0.0208
Iteration 80, loss = 0.0165
--- Epoch 676 / 100000
Iteration 0, loss = 0.0152
Iteration 20, loss = 0.0101
Iteration 40, loss = 0.0492
Iteration 60, loss = 0.0242
Iteration 80, loss = 0.0179
--- Epoch 677 / 100000
Iteration 0, loss = 0.0107
Iteration 20, loss = 0.0080
Iteration 40, loss = 0.0151
Iteration 60, loss = 0.0092
Iteration 80, loss = 0.0238
--- Epoch 678 / 100000
Iteration 0, loss = 0.0143
Iteration 20, loss = 0.0159
Iteration 40, loss = 0.0172
Iteration 60, loss = 0.0185
Iteration 80, loss = 0.0143
--- Epoch 679 / 100000
Iteration 0, loss = 0.0209
Iteration 20, loss = 0.0088
Iteration 40, loss = 0.0095
Iteration 60, loss = 0.0153
Iteration 80, loss = 0.0293
--- Epoch 680 / 100000
Iteration 0, loss = 0.0147
Iteration 20, loss = 0.0092
Iteration 40, loss = 0.0176
Iteration 60, loss = 0.0179
Iteration 80, loss = 0.0142
--- Epoch 681 / 100000
Iteration 0, loss = 0.0093
Iteration 20, loss = 0.0306
Iteration 40, loss = 0.0089
Iteration 60, loss = 0.0224
Iteration 80, loss = 0.0141
--- Epoch 682 / 100000
Iteration 0, loss = 0.0211
Iteration 20, loss = 0.0220
Iteration 40, loss = 0.0096
Iteration 60, loss = 0.0173
Iteration 80, loss = 0.0104
--- Epoch 683 / 100000
Iteration 0, loss = 0.0349
Iteration 20, loss = 0.0162
Iteration 40, loss = 0.0237
Iteration 60, loss = 0.0105
Iteration 80, loss = 0.0099
--- Epoch 684 / 100000
Iteration 0, loss = 0.0171
Iteration 20, loss = 0.0086
Iteration 40, loss = 0.0123
Iteration 60, loss = 0.0213
Iteration 80, loss = 0.0119
--- Epoch 685 / 100000
Iteration 0, loss = 0.0110
Iteration 20, loss = 0.0102
Iteration 40, loss = 0.0077
Iteration 60, loss = 0.0141
Iteration 80, loss = 0.0165
--- Epoch 686 / 100000
Iteration 0, loss = 0.0253
Iteration 20, loss = 0.0169
Iteration 40, loss = 0.0217
Iteration 60, loss = 0.0316
Iteration 80, loss = 0.0216
--- Epoch 687 / 100000
Iteration 0, loss = 0.0180
Iteration 20, loss = 0.0168
Iteration 40, loss = 0.0185
Iteration 60, loss = 0.0357
Iteration 80, loss = 0.0171
--- Epoch 688 / 100000
Iteration 0, loss = 0.0094
Iteration 20, loss = 0.0129
Iteration 40, loss = 0.0172
Iteration 60, loss = 0.0126
Iteration 80, loss = 0.0133
--- Epoch 689 / 100000
Iteration 0, loss = 0.0255
Iteration 20, loss = 0.0100
Iteration 40, loss = 0.0172
Iteration 60, loss = 0.0077
Iteration 80, loss = 0.0134
--- Epoch 690 / 100000
Iteration 0, loss = 0.0121
Iteration 20, loss = 0.0194
Iteration 40, loss = 0.0191
Iteration 60, loss = 0.0267
Iteration 80, loss = 0.0158
--- Epoch 691 / 100000
Iteration 0, loss = 0.0111
Iteration 20, loss = 0.0307
Iteration 40, loss = 0.0118
Iteration 60, loss = 0.0149
Iteration 80, loss = 0.0176
--- Epoch 692 / 100000
Iteration 0, loss = 0.0091
Iteration 20, loss = 0.0208
Iteration 40, loss = 0.0068
Iteration 60, loss = 0.0149
Iteration 80, loss = 0.0070
--- Epoch 693 / 100000
Iteration 0, loss = 0.0198
Iteration 20, loss = 0.0135
Iteration 40, loss = 0.0073
Iteration 60, loss = 0.0225
Iteration 80, loss = 0.0143
--- Epoch 694 / 100000
Iteration 0, loss = 0.0402
Iteration 20, loss = 0.0204
Iteration 40, loss = 0.0229
Iteration 60, loss = 0.0094
Iteration 80, loss = 0.0115
--- Epoch 695 / 100000
Iteration 0, loss = 0.0141
Iteration 20, loss = 0.0078
Iteration 40, loss = 0.0112
Iteration 60, loss = 0.0100
Iteration 80, loss = 0.0239
--- Epoch 696 / 100000
Iteration 0, loss = 0.0132
Iteration 20, loss = 0.0083
Iteration 40, loss = 0.0098
Iteration 60, loss = 0.0378
Iteration 80, loss = 0.0139
--- Epoch 697 / 100000
Iteration 0, loss = 0.0146
Iteration 20, loss = 0.0112
Iteration 40, loss = 0.0183
Iteration 60, loss = 0.0152
Iteration 80, loss = 0.0114
--- Epoch 698 / 100000
Iteration 0, loss = 0.0131
Iteration 20, loss = 0.0142
Iteration 40, loss = 0.0147
Iteration 60, loss = 0.0189
Iteration 80, loss = 0.0195
--- Epoch 699 / 100000
Iteration 0, loss = 0.0148
Iteration 20, loss = 0.0194
Iteration 40, loss = 0.0257
Iteration 60, loss = 0.0124
Iteration 80, loss = 0.0190
--- Epoch 700 / 100000
Iteration 0, loss = 0.0125
Iteration 20, loss = 0.0148
Iteration 40, loss = 0.0198
Iteration 60, loss = 0.0139
Iteration 80, loss = 0.0165
--- Epoch 701 / 100000
Iteration 0, loss = 0.0161
Iteration 20, loss = 0.0227
Iteration 40, loss = 0.0111
Iteration 60, loss = 0.0109
Iteration 80, loss = 0.0124
--- Epoch 702 / 100000
Iteration 0, loss = 0.0156
Iteration 20, loss = 0.0095
Iteration 40, loss = 0.0111
Iteration 60, loss = 0.0100
Iteration 80, loss = 0.0147
--- Epoch 703 / 100000
Iteration 0, loss = 0.0138
Iteration 20, loss = 0.0143
Iteration 40, loss = 0.0158
Iteration 60, loss = 0.0351
Iteration 80, loss = 0.0118
--- Epoch 704 / 100000
Iteration 0, loss = 0.0117
Iteration 20, loss = 0.0111
Iteration 40, loss = 0.0152
Iteration 60, loss = 0.0125
Iteration 80, loss = 0.0136
--- Epoch 705 / 100000
Iteration 0, loss = 0.0192
Iteration 20, loss = 0.0107
Iteration 40, loss = 0.0146
Iteration 60, loss = 0.0057
Iteration 80, loss = 0.0084
--- Epoch 706 / 100000
Iteration 0, loss = 0.0247
Iteration 20, loss = 0.0097
Iteration 40, loss = 0.0059
Iteration 60, loss = 0.0230
Iteration 80, loss = 0.0178
--- Epoch 707 / 100000
Iteration 0, loss = 0.0163
Iteration 20, loss = 0.0131
Iteration 40, loss = 0.0158
Iteration 60, loss = 0.0168
Iteration 80, loss = 0.0107
--- Epoch 708 / 100000
Iteration 0, loss = 0.0102
Iteration 20, loss = 0.0222
Iteration 40, loss = 0.0080
Iteration 60, loss = 0.0243
Iteration 80, loss = 0.0182
--- Epoch 709 / 100000
Iteration 0, loss = 0.0092
Iteration 20, loss = 0.0119
Iteration 40, loss = 0.0217
Iteration 60, loss = 0.0417
Iteration 80, loss = 0.0219
--- Epoch 710 / 100000
Iteration 0, loss = 0.0170
Iteration 20, loss = 0.0137
Iteration 40, loss = 0.0126
Iteration 60, loss = 0.0151
Iteration 80, loss = 0.0325
--- Epoch 711 / 100000
Iteration 0, loss = 0.0158
Iteration 20, loss = 0.0185
Iteration 40, loss = 0.0091
Iteration 60, loss = 0.0290
Iteration 80, loss = 0.0244
--- Epoch 712 / 100000
Iteration 0, loss = 0.0331
Iteration 20, loss = 0.0128
Iteration 40, loss = 0.0449
Iteration 60, loss = 0.0112
Iteration 80, loss = 0.0223
--- Epoch 713 / 100000
Iteration 0, loss = 0.0122
Iteration 20, loss = 0.0115
Iteration 40, loss = 0.0127
Iteration 60, loss = 0.0117
Iteration 80, loss = 0.0136
--- Epoch 714 / 100000
Iteration 0, loss = 0.0144
Iteration 20, loss = 0.0241
Iteration 40, loss = 0.0166
Iteration 60, loss = 0.0130
Iteration 80, loss = 0.0106
--- Epoch 715 / 100000
Iteration 0, loss = 0.0150
Iteration 20, loss = 0.0156
Iteration 40, loss = 0.0140
Iteration 60, loss = 0.0139
Iteration 80, loss = 0.0209
--- Epoch 716 / 100000
Iteration 0, loss = 0.0204
Iteration 20, loss = 0.0094
Iteration 40, loss = 0.0162
Iteration 60, loss = 0.0150
Iteration 80, loss = 0.0129
--- Epoch 717 / 100000
Iteration 0, loss = 0.0132
Iteration 20, loss = 0.0113
Iteration 40, loss = 0.0153
Iteration 60, loss = 0.0153
Iteration 80, loss = 0.0076
--- Epoch 718 / 100000
Iteration 0, loss = 0.0104
Iteration 20, loss = 0.0198
Iteration 40, loss = 0.0143
Iteration 60, loss = 0.0175
Iteration 80, loss = 0.0139
--- Epoch 719 / 100000
Iteration 0, loss = 0.0111
Iteration 20, loss = 0.0176
Iteration 40, loss = 0.0098
Iteration 60, loss = 0.0143
Iteration 80, loss = 0.0156
--- Epoch 720 / 100000
Iteration 0, loss = 0.0177
Iteration 20, loss = 0.0112
Iteration 40, loss = 0.0096
Iteration 60, loss = 0.0292
Iteration 80, loss = 0.0148
--- Epoch 721 / 100000
Iteration 0, loss = 0.0210
Iteration 20, loss = 0.0100
Iteration 40, loss = 0.0101
Iteration 60, loss = 0.0192
Iteration 80, loss = 0.0200
--- Epoch 722 / 100000
Iteration 0, loss = 0.0105
Iteration 20, loss = 0.0153
Iteration 40, loss = 0.0148
Iteration 60, loss = 0.0178
Iteration 80, loss = 0.0126
--- Epoch 723 / 100000
Iteration 0, loss = 0.0168
Iteration 20, loss = 0.0185
Iteration 40, loss = 0.0119
Iteration 60, loss = 0.0162
Iteration 80, loss = 0.0160
--- Epoch 724 / 100000
Iteration 0, loss = 0.0111
Iteration 20, loss = 0.0094
Iteration 40, loss = 0.0093
Iteration 60, loss = 0.0202
Iteration 80, loss = 0.0068
--- Epoch 725 / 100000
Iteration 0, loss = 0.0079
Iteration 20, loss = 0.0187
Iteration 40, loss = 0.0110
Iteration 60, loss = 0.0102
Iteration 80, loss = 0.0259
--- Epoch 726 / 100000
Iteration 0, loss = 0.0104
Iteration 20, loss = 0.0091
Iteration 40, loss = 0.0120
Iteration 60, loss = 0.0149
Iteration 80, loss = 0.0247
--- Epoch 727 / 100000
Iteration 0, loss = 0.0132
Iteration 20, loss = 0.0106
Iteration 40, loss = 0.0137
Iteration 60, loss = 0.0208
Iteration 80, loss = 0.0225
--- Epoch 728 / 100000
Iteration 0, loss = 0.0094
Iteration 20, loss = 0.0107
Iteration 40, loss = 0.0149
Iteration 60, loss = 0.0206
Iteration 80, loss = 0.0169
--- Epoch 729 / 100000
Iteration 0, loss = 0.0193
Iteration 20, loss = 0.0210
Iteration 40, loss = 0.0156
Iteration 60, loss = 0.0098
Iteration 80, loss = 0.0247
--- Epoch 730 / 100000
Iteration 0, loss = 0.0150
Iteration 20, loss = 0.0181
Iteration 40, loss = 0.0167
Iteration 60, loss = 0.0105
Iteration 80, loss = 0.0097
--- Epoch 731 / 100000
Iteration 0, loss = 0.0152
Iteration 20, loss = 0.0135
Iteration 40, loss = 0.0085
Iteration 60, loss = 0.0242
Iteration 80, loss = 0.0227
--- Epoch 732 / 100000
Iteration 0, loss = 0.0200
Iteration 20, loss = 0.0133
Iteration 40, loss = 0.0144
Iteration 60, loss = 0.0120
Iteration 80, loss = 0.0134
--- Epoch 733 / 100000
Iteration 0, loss = 0.0098
Iteration 20, loss = 0.0113
Iteration 40, loss = 0.0196
Iteration 60, loss = 0.0209
Iteration 80, loss = 0.0230
--- Epoch 734 / 100000
Iteration 0, loss = 0.0143
Iteration 20, loss = 0.0265
Iteration 40, loss = 0.0176
Iteration 60, loss = 0.0079
Iteration 80, loss = 0.0281
--- Epoch 735 / 100000
Iteration 0, loss = 0.0497
Iteration 20, loss = 0.0148
Iteration 40, loss = 0.0130
Iteration 60, loss = 0.0200
Iteration 80, loss = 0.0142
--- Epoch 736 / 100000
Iteration 0, loss = 0.0133
Iteration 20, loss = 0.0144
Iteration 40, loss = 0.0258
Iteration 60, loss = 0.0268
Iteration 80, loss = 0.0118
--- Epoch 737 / 100000
Iteration 0, loss = 0.0140
Iteration 20, loss = 0.0091
Iteration 40, loss = 0.0099
Iteration 60, loss = 0.0254
Iteration 80, loss = 0.0162
--- Epoch 738 / 100000
Iteration 0, loss = 0.0227
Iteration 20, loss = 0.0092
Iteration 40, loss = 0.0077
Iteration 60, loss = 0.0233
Iteration 80, loss = 0.0176
--- Epoch 739 / 100000
Iteration 0, loss = 0.0109
Iteration 20, loss = 0.0156
Iteration 40, loss = 0.0112
Iteration 60, loss = 0.0186
Iteration 80, loss = 0.0129
--- Epoch 740 / 100000
Iteration 0, loss = 0.0140
Iteration 20, loss = 0.0153
Iteration 40, loss = 0.0134
Iteration 60, loss = 0.0185
Iteration 80, loss = 0.0096
--- Epoch 741 / 100000
Iteration 0, loss = 0.0080
Iteration 20, loss = 0.0185
Iteration 40, loss = 0.0104
Iteration 60, loss = 0.0094
Iteration 80, loss = 0.0103
--- Epoch 742 / 100000
Iteration 0, loss = 0.0233
Iteration 20, loss = 0.0072
Iteration 40, loss = 0.0443
Iteration 60, loss = 0.0248
Iteration 80, loss = 0.0105
--- Epoch 743 / 100000
Iteration 0, loss = 0.0127
Iteration 20, loss = 0.0115
Iteration 40, loss = 0.0239
Iteration 60, loss = 0.0101
Iteration 80, loss = 0.0196
--- Epoch 744 / 100000
Iteration 0, loss = 0.0182
Iteration 20, loss = 0.0142
Iteration 40, loss = 0.0091
Iteration 60, loss = 0.0179
Iteration 80, loss = 0.0209
--- Epoch 745 / 100000
Iteration 0, loss = 0.0155
Iteration 20, loss = 0.0198
Iteration 40, loss = 0.0096
Iteration 60, loss = 0.0232
Iteration 80, loss = 0.0089
--- Epoch 746 / 100000
Iteration 0, loss = 0.0091
Iteration 20, loss = 0.0095
Iteration 40, loss = 0.0101
Iteration 60, loss = 0.0112
Iteration 80, loss = 0.0126
--- Epoch 747 / 100000
Iteration 0, loss = 0.0209
Iteration 20, loss = 0.0121
Iteration 40, loss = 0.0106
Iteration 60, loss = 0.0142
Iteration 80, loss = 0.0262
--- Epoch 748 / 100000
Iteration 0, loss = 0.0220
Iteration 20, loss = 0.0112
Iteration 40, loss = 0.0088
Iteration 60, loss = 0.0073
Iteration 80, loss = 0.0114
--- Epoch 749 / 100000
Iteration 0, loss = 0.0213
Iteration 20, loss = 0.0083
Iteration 40, loss = 0.0075
Iteration 60, loss = 0.0116
Iteration 80, loss = 0.0097
--- Epoch 750 / 100000
Iteration 0, loss = 0.0185
Iteration 20, loss = 0.0161
Iteration 40, loss = 0.0431
Iteration 60, loss = 0.0094
Iteration 80, loss = 0.0090
--- Epoch 751 / 100000
Iteration 0, loss = 0.0140
Iteration 20, loss = 0.0419
Iteration 40, loss = 0.0139
Iteration 60, loss = 0.0578
Iteration 80, loss = 0.0144
--- Epoch 752 / 100000
Iteration 0, loss = 0.0170
Iteration 20, loss = 0.0193
Iteration 40, loss = 0.0193
Iteration 60, loss = 0.0191
Iteration 80, loss = 0.0219
--- Epoch 753 / 100000
Iteration 0, loss = 0.0119
Iteration 20, loss = 0.0239
Iteration 40, loss = 0.0125
Iteration 60, loss = 0.0114
Iteration 80, loss = 0.0424
--- Epoch 754 / 100000
Iteration 0, loss = 0.0208
Iteration 20, loss = 0.0125
Iteration 40, loss = 0.0084
Iteration 60, loss = 0.0081
Iteration 80, loss = 0.0176
--- Epoch 755 / 100000
Iteration 0, loss = 0.0266
Iteration 20, loss = 0.0165
Iteration 40, loss = 0.0098
Iteration 60, loss = 0.0183
Iteration 80, loss = 0.0245
--- Epoch 756 / 100000
Iteration 0, loss = 0.0079
Iteration 20, loss = 0.0167
Iteration 40, loss = 0.0254
Iteration 60, loss = 0.0132
Iteration 80, loss = 0.0140
--- Epoch 757 / 100000
Iteration 0, loss = 0.0153
Iteration 20, loss = 0.0307
Iteration 40, loss = 0.0199
Iteration 60, loss = 0.0148
Iteration 80, loss = 0.0108
--- Epoch 758 / 100000
Iteration 0, loss = 0.0233
Iteration 20, loss = 0.0157
Iteration 40, loss = 0.0151
Iteration 60, loss = 0.0088
Iteration 80, loss = 0.0084
--- Epoch 759 / 100000
Iteration 0, loss = 0.0179
Iteration 20, loss = 0.0105
Iteration 40, loss = 0.0231
Iteration 60, loss = 0.0239
Iteration 80, loss = 0.0324
--- Epoch 760 / 100000
Iteration 0, loss = 0.0112
Iteration 20, loss = 0.0142
Iteration 40, loss = 0.0336
Iteration 60, loss = 0.0078
Iteration 80, loss = 0.0138
--- Epoch 761 / 100000
Iteration 0, loss = 0.0102
Iteration 20, loss = 0.0269
Iteration 40, loss = 0.0089
Iteration 60, loss = 0.0128
Iteration 80, loss = 0.0090
--- Epoch 762 / 100000
Iteration 0, loss = 0.0118
Iteration 20, loss = 0.0267
Iteration 40, loss = 0.0120
Iteration 60, loss = 0.0112
Iteration 80, loss = 0.0198
--- Epoch 763 / 100000
Iteration 0, loss = 0.0288
Iteration 20, loss = 0.0081
Iteration 40, loss = 0.0242
Iteration 60, loss = 0.0382
Iteration 80, loss = 0.0124
--- Epoch 764 / 100000
Iteration 0, loss = 0.0114
Iteration 20, loss = 0.0422
Iteration 40, loss = 0.0114
Iteration 60, loss = 0.0122
Iteration 80, loss = 0.0175
--- Epoch 765 / 100000
Iteration 0, loss = 0.0092
Iteration 20, loss = 0.0144
Iteration 40, loss = 0.0153
Iteration 60, loss = 0.0231
Iteration 80, loss = 0.0148
--- Epoch 766 / 100000
Iteration 0, loss = 0.0069
Iteration 20, loss = 0.0100
Iteration 40, loss = 0.0147
Iteration 60, loss = 0.0170
Iteration 80, loss = 0.0177
--- Epoch 767 / 100000
Iteration 0, loss = 0.0108
Iteration 20, loss = 0.0155
Iteration 40, loss = 0.0089
Iteration 60, loss = 0.0141
Iteration 80, loss = 0.0307
--- Epoch 768 / 100000
Iteration 0, loss = 0.0153
Iteration 20, loss = 0.0118
Iteration 40, loss = 0.0218
Iteration 60, loss = 0.0167
Iteration 80, loss = 0.0130
--- Epoch 769 / 100000
Iteration 0, loss = 0.0166
Iteration 20, loss = 0.0104
Iteration 40, loss = 0.0165
Iteration 60, loss = 0.0193
Iteration 80, loss = 0.0125
--- Epoch 770 / 100000
Iteration 0, loss = 0.0217
Iteration 20, loss = 0.0094
Iteration 40, loss = 0.0204
Iteration 60, loss = 0.0106
Iteration 80, loss = 0.0132
--- Epoch 771 / 100000
Iteration 0, loss = 0.0244
Iteration 20, loss = 0.0118
Iteration 40, loss = 0.0159
Iteration 60, loss = 0.0114
Iteration 80, loss = 0.0284
--- Epoch 772 / 100000
Iteration 0, loss = 0.0131
Iteration 20, loss = 0.0150
Iteration 40, loss = 0.0075
Iteration 60, loss = 0.0114
Iteration 80, loss = 0.0118
--- Epoch 773 / 100000
Iteration 0, loss = 0.0084
Iteration 20, loss = 0.0075
Iteration 40, loss = 0.0127
Iteration 60, loss = 0.0106
Iteration 80, loss = 0.0213
--- Epoch 774 / 100000
Iteration 0, loss = 0.0074
Iteration 20, loss = 0.0114
Iteration 40, loss = 0.0104
Iteration 60, loss = 0.0096
Iteration 80, loss = 0.0099
--- Epoch 775 / 100000
Iteration 0, loss = 0.0211
Iteration 20, loss = 0.0128
Iteration 40, loss = 0.0188
Iteration 60, loss = 0.0072
Iteration 80, loss = 0.0146
--- Epoch 776 / 100000
Iteration 0, loss = 0.0163
Iteration 20, loss = 0.0171
Iteration 40, loss = 0.0219
Iteration 60, loss = 0.0112
Iteration 80, loss = 0.0286
--- Epoch 777 / 100000
Iteration 0, loss = 0.0101
Iteration 20, loss = 0.0144
Iteration 40, loss = 0.0409
Iteration 60, loss = 0.0112
Iteration 80, loss = 0.0110
--- Epoch 778 / 100000
Iteration 0, loss = 0.0362
Iteration 20, loss = 0.0151
Iteration 40, loss = 0.0329
Iteration 60, loss = 0.0222
Iteration 80, loss = 0.0103
--- Epoch 779 / 100000
Iteration 0, loss = 0.0278
Iteration 20, loss = 0.0190
Iteration 40, loss = 0.0118
Iteration 60, loss = 0.0148
Iteration 80, loss = 0.0113
--- Epoch 780 / 100000
Iteration 0, loss = 0.0297
Iteration 20, loss = 0.0098
Iteration 40, loss = 0.0095
Iteration 60, loss = 0.0079
Iteration 80, loss = 0.0148
--- Epoch 781 / 100000
Iteration 0, loss = 0.0198
Iteration 20, loss = 0.0134
Iteration 40, loss = 0.0199
Iteration 60, loss = 0.0207
Iteration 80, loss = 0.0191
--- Epoch 782 / 100000
Iteration 0, loss = 0.0071
Iteration 20, loss = 0.0254
Iteration 40, loss = 0.0286
Iteration 60, loss = 0.0133
Iteration 80, loss = 0.0084
--- Epoch 783 / 100000
Iteration 0, loss = 0.0192
Iteration 20, loss = 0.0171
Iteration 40, loss = 0.0104
Iteration 60, loss = 0.0142
Iteration 80, loss = 0.0187
--- Epoch 784 / 100000
Iteration 0, loss = 0.0106
Iteration 20, loss = 0.0182
Iteration 40, loss = 0.0084
Iteration 60, loss = 0.0092
Iteration 80, loss = 0.0085
--- Epoch 785 / 100000
Iteration 0, loss = 0.0168
Iteration 20, loss = 0.0199
Iteration 40, loss = 0.0167
Iteration 60, loss = 0.0178
Iteration 80, loss = 0.0169
--- Epoch 786 / 100000
Iteration 0, loss = 0.0191
Iteration 20, loss = 0.0485
Iteration 40, loss = 0.0245
Iteration 60, loss = 0.0202
Iteration 80, loss = 0.0299
--- Epoch 787 / 100000
Iteration 0, loss = 0.0105
Iteration 20, loss = 0.0135
Iteration 40, loss = 0.0247
Iteration 60, loss = 0.0182
Iteration 80, loss = 0.0159
--- Epoch 788 / 100000
Iteration 0, loss = 0.0109
Iteration 20, loss = 0.0162
Iteration 40, loss = 0.0109
Iteration 60, loss = 0.0112
Iteration 80, loss = 0.0104
--- Epoch 789 / 100000
Iteration 0, loss = 0.0099
Iteration 20, loss = 0.0322
Iteration 40, loss = 0.0130
Iteration 60, loss = 0.0203
Iteration 80, loss = 0.0163
--- Epoch 790 / 100000
Iteration 0, loss = 0.0140
Iteration 20, loss = 0.0082
Iteration 40, loss = 0.0111
Iteration 60, loss = 0.0161
Iteration 80, loss = 0.0129
--- Epoch 791 / 100000
Iteration 0, loss = 0.0189
Iteration 20, loss = 0.0147
Iteration 40, loss = 0.0245
Iteration 60, loss = 0.0144
Iteration 80, loss = 0.0094
--- Epoch 792 / 100000
Iteration 0, loss = 0.0135
Iteration 20, loss = 0.0122
Iteration 40, loss = 0.0127
Iteration 60, loss = 0.0152
Iteration 80, loss = 0.0100
--- Epoch 793 / 100000
Iteration 0, loss = 0.0059
Iteration 20, loss = 0.0146
Iteration 40, loss = 0.0168
Iteration 60, loss = 0.0169
Iteration 80, loss = 0.0117
--- Epoch 794 / 100000
Iteration 0, loss = 0.0155
Iteration 20, loss = 0.0193
Iteration 40, loss = 0.0213
Iteration 60, loss = 0.0160
Iteration 80, loss = 0.0103
--- Epoch 795 / 100000
Iteration 0, loss = 0.0154
Iteration 20, loss = 0.0245
Iteration 40, loss = 0.0103
Iteration 60, loss = 0.0181
Iteration 80, loss = 0.0196
--- Epoch 796 / 100000
Iteration 0, loss = 0.0245
Iteration 20, loss = 0.0176
Iteration 40, loss = 0.0143
Iteration 60, loss = 0.0181
Iteration 80, loss = 0.0098
--- Epoch 797 / 100000
Iteration 0, loss = 0.0161
Iteration 20, loss = 0.0165
Iteration 40, loss = 0.0233
Iteration 60, loss = 0.0186
Iteration 80, loss = 0.0198
--- Epoch 798 / 100000
Iteration 0, loss = 0.0329
Iteration 20, loss = 0.0095
Iteration 40, loss = 0.0172
Iteration 60, loss = 0.0105
Iteration 80, loss = 0.0118
--- Epoch 799 / 100000
Iteration 0, loss = 0.0231
Iteration 20, loss = 0.0163
Iteration 40, loss = 0.0169
Iteration 60, loss = 0.0221
Iteration 80, loss = 0.0144
--- Epoch 800 / 100000
Iteration 0, loss = 0.0220
Iteration 20, loss = 0.0159
Iteration 40, loss = 0.0217
Iteration 60, loss = 0.0197
Iteration 80, loss = 0.0120
--- Epoch 801 / 100000
Iteration 0, loss = 0.0078
Iteration 20, loss = 0.0104
Iteration 40, loss = 0.0096
Iteration 60, loss = 0.0165
Iteration 80, loss = 0.0170
--- Epoch 802 / 100000
Iteration 0, loss = 0.0128
Iteration 20, loss = 0.0104
Iteration 40, loss = 0.0227
Iteration 60, loss = 0.0076
Iteration 80, loss = 0.0103
--- Epoch 803 / 100000
Iteration 0, loss = 0.0124
Iteration 20, loss = 0.0158
Iteration 40, loss = 0.0138
Iteration 60, loss = 0.0173
Iteration 80, loss = 0.0246
--- Epoch 804 / 100000
Iteration 0, loss = 0.0106
Iteration 20, loss = 0.0085
Iteration 40, loss = 0.0104
Iteration 60, loss = 0.0168
Iteration 80, loss = 0.0115
--- Epoch 805 / 100000
Iteration 0, loss = 0.0084
Iteration 20, loss = 0.0172
Iteration 40, loss = 0.0189
Iteration 60, loss = 0.0100
Iteration 80, loss = 0.0096
--- Epoch 806 / 100000
Iteration 0, loss = 0.0142
Iteration 20, loss = 0.0137
Iteration 40, loss = 0.0131
Iteration 60, loss = 0.0111
Iteration 80, loss = 0.0145
--- Epoch 807 / 100000
Iteration 0, loss = 0.0156
Iteration 20, loss = 0.0088
Iteration 40, loss = 0.0138
Iteration 60, loss = 0.0156
Iteration 80, loss = 0.0156
--- Epoch 808 / 100000
Iteration 0, loss = 0.0369
Iteration 20, loss = 0.0207
Iteration 40, loss = 0.0140
Iteration 60, loss = 0.0106
Iteration 80, loss = 0.0182
--- Epoch 809 / 100000
Iteration 0, loss = 0.0147
Iteration 20, loss = 0.0135
Iteration 40, loss = 0.0076
Iteration 60, loss = 0.0140
Iteration 80, loss = 0.0163
--- Epoch 810 / 100000
Iteration 0, loss = 0.0186
Iteration 20, loss = 0.0121
Iteration 40, loss = 0.0248
Iteration 60, loss = 0.0163
Iteration 80, loss = 0.0600
--- Epoch 811 / 100000
Iteration 0, loss = 0.0199
Iteration 20, loss = 0.0087
Iteration 40, loss = 0.0122
Iteration 60, loss = 0.0118
Iteration 80, loss = 0.0157
--- Epoch 812 / 100000
Iteration 0, loss = 0.0192
Iteration 20, loss = 0.0102
Iteration 40, loss = 0.0140
Iteration 60, loss = 0.0102
Iteration 80, loss = 0.0162
--- Epoch 813 / 100000
Iteration 0, loss = 0.0144
Iteration 20, loss = 0.0080
Iteration 40, loss = 0.0103
Iteration 60, loss = 0.0203
Iteration 80, loss = 0.0122
--- Epoch 814 / 100000
Iteration 0, loss = 0.0121
Iteration 20, loss = 0.0194
Iteration 40, loss = 0.0084
Iteration 60, loss = 0.0194
Iteration 80, loss = 0.0182
--- Epoch 815 / 100000
Iteration 0, loss = 0.0089
Iteration 20, loss = 0.0089
Iteration 40, loss = 0.0123
Iteration 60, loss = 0.0110
Iteration 80, loss = 0.0172
--- Epoch 816 / 100000
Iteration 0, loss = 0.0115
Iteration 20, loss = 0.0099
Iteration 40, loss = 0.0149
Iteration 60, loss = 0.0171
Iteration 80, loss = 0.0107
--- Epoch 817 / 100000
Iteration 0, loss = 0.0089
Iteration 20, loss = 0.0200
Iteration 40, loss = 0.0265
Iteration 60, loss = 0.0224
Iteration 80, loss = 0.0229
--- Epoch 818 / 100000
Iteration 0, loss = 0.0094
Iteration 20, loss = 0.0116
Iteration 40, loss = 0.0190
Iteration 60, loss = 0.0216
Iteration 80, loss = 0.0098
--- Epoch 819 / 100000
Iteration 0, loss = 0.0060
Iteration 20, loss = 0.0259
Iteration 40, loss = 0.0169
Iteration 60, loss = 0.0331
Iteration 80, loss = 0.0183
--- Epoch 820 / 100000
Iteration 0, loss = 0.0208
Iteration 20, loss = 0.0097
Iteration 40, loss = 0.0303
Iteration 60, loss = 0.0091
Iteration 80, loss = 0.0172
--- Epoch 821 / 100000
Iteration 0, loss = 0.0098
Iteration 20, loss = 0.0084
Iteration 40, loss = 0.0128
Iteration 60, loss = 0.0178
Iteration 80, loss = 0.0158
--- Epoch 822 / 100000
Iteration 0, loss = 0.0085
Iteration 20, loss = 0.0198
Iteration 40, loss = 0.0257
Iteration 60, loss = 0.0135
Iteration 80, loss = 0.0098
--- Epoch 823 / 100000
Iteration 0, loss = 0.0165
Iteration 20, loss = 0.0227
Iteration 40, loss = 0.0090
Iteration 60, loss = 0.0100
Iteration 80, loss = 0.0070
--- Epoch 824 / 100000
Iteration 0, loss = 0.0305
Iteration 20, loss = 0.0148
Iteration 40, loss = 0.0262
Iteration 60, loss = 0.0089
Iteration 80, loss = 0.0129
--- Epoch 825 / 100000
Iteration 0, loss = 0.0090
Iteration 20, loss = 0.0153
Iteration 40, loss = 0.0153
Iteration 60, loss = 0.0084
Iteration 80, loss = 0.0302
--- Epoch 826 / 100000
Iteration 0, loss = 0.0093
Iteration 20, loss = 0.0104
Iteration 40, loss = 0.0098
Iteration 60, loss = 0.0175
Iteration 80, loss = 0.0206
--- Epoch 827 / 100000
Iteration 0, loss = 0.0104
Iteration 20, loss = 0.0156
Iteration 40, loss = 0.0134
Iteration 60, loss = 0.0302
Iteration 80, loss = 0.0263
--- Epoch 828 / 100000
Iteration 0, loss = 0.0137
Iteration 20, loss = 0.0114
Iteration 40, loss = 0.0117
Iteration 60, loss = 0.0130
Iteration 80, loss = 0.0247
--- Epoch 829 / 100000
Iteration 0, loss = 0.0159
Iteration 20, loss = 0.0328
Iteration 40, loss = 0.0100
Iteration 60, loss = 0.0129
Iteration 80, loss = 0.0163
--- Epoch 830 / 100000
Iteration 0, loss = 0.0116
Iteration 20, loss = 0.0078
Iteration 40, loss = 0.0254
Iteration 60, loss = 0.0150
Iteration 80, loss = 0.0104
--- Epoch 831 / 100000
Iteration 0, loss = 0.0159
Iteration 20, loss = 0.0102
Iteration 40, loss = 0.0146
Iteration 60, loss = 0.0217
Iteration 80, loss = 0.0153
--- Epoch 832 / 100000
Iteration 0, loss = 0.0165
Iteration 20, loss = 0.0148
Iteration 40, loss = 0.0169
Iteration 60, loss = 0.0283
Iteration 80, loss = 0.0122
--- Epoch 833 / 100000
Iteration 0, loss = 0.0156
Iteration 20, loss = 0.0137
Iteration 40, loss = 0.0234
Iteration 60, loss = 0.0120
Iteration 80, loss = 0.0083
--- Epoch 834 / 100000
Iteration 0, loss = 0.0238
Iteration 20, loss = 0.0079
Iteration 40, loss = 0.0281
Iteration 60, loss = 0.0210
Iteration 80, loss = 0.0197
--- Epoch 835 / 100000
Iteration 0, loss = 0.0153
Iteration 20, loss = 0.0118
Iteration 40, loss = 0.0082
Iteration 60, loss = 0.0106
Iteration 80, loss = 0.0262
--- Epoch 836 / 100000
Iteration 0, loss = 0.0124
Iteration 20, loss = 0.0196
Iteration 40, loss = 0.0201
Iteration 60, loss = 0.0119
Iteration 80, loss = 0.0128
--- Epoch 837 / 100000
Iteration 0, loss = 0.0244
Iteration 20, loss = 0.0151
Iteration 40, loss = 0.0113
Iteration 60, loss = 0.0240
Iteration 80, loss = 0.0197
--- Epoch 838 / 100000
Iteration 0, loss = 0.0119
Iteration 20, loss = 0.0109
Iteration 40, loss = 0.0294
Iteration 60, loss = 0.0122
Iteration 80, loss = 0.0131
--- Epoch 839 / 100000
Iteration 0, loss = 0.0134
Iteration 20, loss = 0.0096
Iteration 40, loss = 0.0139
Iteration 60, loss = 0.0113
Iteration 80, loss = 0.0144
--- Epoch 840 / 100000
Iteration 0, loss = 0.0082
Iteration 20, loss = 0.0113
Iteration 40, loss = 0.0089
Iteration 60, loss = 0.0090
Iteration 80, loss = 0.0122
--- Epoch 841 / 100000
Iteration 0, loss = 0.0219
Iteration 20, loss = 0.0208
Iteration 40, loss = 0.0266
Iteration 60, loss = 0.0290
Iteration 80, loss = 0.0088
--- Epoch 842 / 100000
Iteration 0, loss = 0.0146
Iteration 20, loss = 0.0094
Iteration 40, loss = 0.0092
Iteration 60, loss = 0.0135
Iteration 80, loss = 0.0107
--- Epoch 843 / 100000
Iteration 0, loss = 0.0076
Iteration 20, loss = 0.0107
Iteration 40, loss = 0.0098
Iteration 60, loss = 0.0111
Iteration 80, loss = 0.0190
--- Epoch 844 / 100000
Iteration 0, loss = 0.0189
Iteration 20, loss = 0.0108
Iteration 40, loss = 0.0320
Iteration 60, loss = 0.0112
Iteration 80, loss = 0.0234
--- Epoch 845 / 100000
Iteration 0, loss = 0.0110
Iteration 20, loss = 0.0158
Iteration 40, loss = 0.0088
Iteration 60, loss = 0.0240
Iteration 80, loss = 0.0118
--- Epoch 846 / 100000
Iteration 0, loss = 0.0177
Iteration 20, loss = 0.0067
Iteration 40, loss = 0.0396
Iteration 60, loss = 0.0408
Iteration 80, loss = 0.0158
--- Epoch 847 / 100000
Iteration 0, loss = 0.0133
Iteration 20, loss = 0.0185
Iteration 40, loss = 0.0103
Iteration 60, loss = 0.0106
Iteration 80, loss = 0.0062
--- Epoch 848 / 100000
Iteration 0, loss = 0.0099
Iteration 20, loss = 0.0105
Iteration 40, loss = 0.0115
Iteration 60, loss = 0.0213
Iteration 80, loss = 0.0114
--- Epoch 849 / 100000
Iteration 0, loss = 0.0110
Iteration 20, loss = 0.0109
Iteration 40, loss = 0.0130
Iteration 60, loss = 0.0539
Iteration 80, loss = 0.0182
--- Epoch 850 / 100000
Iteration 0, loss = 0.0111
Iteration 20, loss = 0.0153
Iteration 40, loss = 0.0150
Iteration 60, loss = 0.0268
Iteration 80, loss = 0.0120
--- Epoch 851 / 100000
Iteration 0, loss = 0.0177
Iteration 20, loss = 0.0096
Iteration 40, loss = 0.0159
Iteration 60, loss = 0.0135
Iteration 80, loss = 0.0114
--- Epoch 852 / 100000
Iteration 0, loss = 0.0147
Iteration 20, loss = 0.0154
Iteration 40, loss = 0.0229
Iteration 60, loss = 0.0091
Iteration 80, loss = 0.0134
--- Epoch 853 / 100000
Iteration 0, loss = 0.0118
Iteration 20, loss = 0.0174
Iteration 40, loss = 0.0094
Iteration 60, loss = 0.0473
Iteration 80, loss = 0.0124
--- Epoch 854 / 100000
Iteration 0, loss = 0.0108
Iteration 20, loss = 0.0166
Iteration 40, loss = 0.0099
Iteration 60, loss = 0.0144
Iteration 80, loss = 0.0181
--- Epoch 855 / 100000
Iteration 0, loss = 0.0115
Iteration 20, loss = 0.0103
Iteration 40, loss = 0.0298
Iteration 60, loss = 0.0146
Iteration 80, loss = 0.0135
--- Epoch 856 / 100000
Iteration 0, loss = 0.0175
Iteration 20, loss = 0.0097
Iteration 40, loss = 0.0164
Iteration 60, loss = 0.0210
Iteration 80, loss = 0.0262
--- Epoch 857 / 100000
Iteration 0, loss = 0.0141
Iteration 20, loss = 0.0166
Iteration 40, loss = 0.0116
Iteration 60, loss = 0.0096
Iteration 80, loss = 0.0081
--- Epoch 858 / 100000
Iteration 0, loss = 0.0099
Iteration 20, loss = 0.0154
Iteration 40, loss = 0.0104
Iteration 60, loss = 0.0125
Iteration 80, loss = 0.0122
--- Epoch 859 / 100000
Iteration 0, loss = 0.0300
Iteration 20, loss = 0.0356
Iteration 40, loss = 0.0367
Iteration 60, loss = 0.0106
Iteration 80, loss = 0.0346
--- Epoch 860 / 100000
Iteration 0, loss = 0.0108
Iteration 20, loss = 0.0138
Iteration 40, loss = 0.0177
Iteration 60, loss = 0.0082
Iteration 80, loss = 0.0245
--- Epoch 861 / 100000
Iteration 0, loss = 0.0092
Iteration 20, loss = 0.0496
Iteration 40, loss = 0.0136
Iteration 60, loss = 0.0121
Iteration 80, loss = 0.0353
--- Epoch 862 / 100000
Iteration 0, loss = 0.0165
Iteration 20, loss = 0.0289
Iteration 40, loss = 0.0106
Iteration 60, loss = 0.0113
Iteration 80, loss = 0.0074
--- Epoch 863 / 100000
Iteration 0, loss = 0.0216
Iteration 20, loss = 0.0201
Iteration 40, loss = 0.0205
Iteration 60, loss = 0.0117
Iteration 80, loss = 0.0267
--- Epoch 864 / 100000
Iteration 0, loss = 0.0246
Iteration 20, loss = 0.0429
Iteration 40, loss = 0.0097
Iteration 60, loss = 0.0084
Iteration 80, loss = 0.0109
--- Epoch 865 / 100000
Iteration 0, loss = 0.0105
Iteration 20, loss = 0.0167
Iteration 40, loss = 0.0139
Iteration 60, loss = 0.0114
Iteration 80, loss = 0.0146
--- Epoch 866 / 100000
Iteration 0, loss = 0.0152
Iteration 20, loss = 0.0087
Iteration 40, loss = 0.0108
Iteration 60, loss = 0.0199
Iteration 80, loss = 0.0114
--- Epoch 867 / 100000
Iteration 0, loss = 0.0146
Iteration 20, loss = 0.0089
Iteration 40, loss = 0.0153
Iteration 60, loss = 0.0106
Iteration 80, loss = 0.0123
--- Epoch 868 / 100000
Iteration 0, loss = 0.0104
Iteration 20, loss = 0.0149
Iteration 40, loss = 0.0112
Iteration 60, loss = 0.0161
Iteration 80, loss = 0.0193
--- Epoch 869 / 100000
Iteration 0, loss = 0.0172
Iteration 20, loss = 0.0148
Iteration 40, loss = 0.0628
Iteration 60, loss = 0.0102
Iteration 80, loss = 0.0102
--- Epoch 870 / 100000
Iteration 0, loss = 0.0074
Iteration 20, loss = 0.0133
Iteration 40, loss = 0.0085
Iteration 60, loss = 0.0326
Iteration 80, loss = 0.0107
--- Epoch 871 / 100000
Iteration 0, loss = 0.0315
Iteration 20, loss = 0.0106
Iteration 40, loss = 0.0113
Iteration 60, loss = 0.0102
Iteration 80, loss = 0.0282
--- Epoch 872 / 100000
Iteration 0, loss = 0.0108
Iteration 20, loss = 0.0154
Iteration 40, loss = 0.0191
Iteration 60, loss = 0.0119
Iteration 80, loss = 0.0152
--- Epoch 873 / 100000
Iteration 0, loss = 0.0104
Iteration 20, loss = 0.0201
Iteration 40, loss = 0.0095
Iteration 60, loss = 0.0151
Iteration 80, loss = 0.0148
--- Epoch 874 / 100000
Iteration 0, loss = 0.0158
Iteration 20, loss = 0.0103
Iteration 40, loss = 0.0085
Iteration 60, loss = 0.0099
Iteration 80, loss = 0.0338
--- Epoch 875 / 100000
Iteration 0, loss = 0.0349
Iteration 20, loss = 0.0071
Iteration 40, loss = 0.0077
Iteration 60, loss = 0.0183
Iteration 80, loss = 0.0205
--- Epoch 876 / 100000
Iteration 0, loss = 0.0162
Iteration 20, loss = 0.0193
Iteration 40, loss = 0.0099
Iteration 60, loss = 0.0184
Iteration 80, loss = 0.0273
--- Epoch 877 / 100000
Iteration 0, loss = 0.0172
Iteration 20, loss = 0.0130
Iteration 40, loss = 0.0192
Iteration 60, loss = 0.0077
Iteration 80, loss = 0.0312
--- Epoch 878 / 100000
Iteration 0, loss = 0.0175
Iteration 20, loss = 0.0149
Iteration 40, loss = 0.0321
Iteration 60, loss = 0.0127
Iteration 80, loss = 0.0082
--- Epoch 879 / 100000
Iteration 0, loss = 0.0184
Iteration 20, loss = 0.0231
Iteration 40, loss = 0.0099
Iteration 60, loss = 0.0100
Iteration 80, loss = 0.0117
--- Epoch 880 / 100000
Iteration 0, loss = 0.0099
Iteration 20, loss = 0.0100
Iteration 40, loss = 0.0213
Iteration 60, loss = 0.0107
Iteration 80, loss = 0.0099
--- Epoch 881 / 100000
Iteration 0, loss = 0.0128
Iteration 20, loss = 0.0134
Iteration 40, loss = 0.0116
Iteration 60, loss = 0.0090
Iteration 80, loss = 0.0186
--- Epoch 882 / 100000
Iteration 0, loss = 0.0093
Iteration 20, loss = 0.0101
Iteration 40, loss = 0.0361
Iteration 60, loss = 0.0253
Iteration 80, loss = 0.0149
--- Epoch 883 / 100000
Iteration 0, loss = 0.0093
Iteration 20, loss = 0.0154
Iteration 40, loss = 0.0117
Iteration 60, loss = 0.0104
Iteration 80, loss = 0.0079
--- Epoch 884 / 100000
Iteration 0, loss = 0.0124
Iteration 20, loss = 0.0120
Iteration 40, loss = 0.0286
Iteration 60, loss = 0.0119
Iteration 80, loss = 0.0120
--- Epoch 885 / 100000
Iteration 0, loss = 0.0109
Iteration 20, loss = 0.0235
Iteration 40, loss = 0.0101
Iteration 60, loss = 0.0216
Iteration 80, loss = 0.0108
--- Epoch 886 / 100000
Iteration 0, loss = 0.0100
Iteration 20, loss = 0.0103
Iteration 40, loss = 0.0338
Iteration 60, loss = 0.0169
Iteration 80, loss = 0.0077
--- Epoch 887 / 100000
Iteration 0, loss = 0.0181
Iteration 20, loss = 0.0131
Iteration 40, loss = 0.0158
Iteration 60, loss = 0.0160
Iteration 80, loss = 0.0085
--- Epoch 888 / 100000
Iteration 0, loss = 0.0116
Iteration 20, loss = 0.0369
Iteration 40, loss = 0.0181
Iteration 60, loss = 0.0152
Iteration 80, loss = 0.0160
--- Epoch 889 / 100000
Iteration 0, loss = 0.0075
Iteration 20, loss = 0.0069
Iteration 40, loss = 0.0081
Iteration 60, loss = 0.0323
Iteration 80, loss = 0.0274
--- Epoch 890 / 100000
Iteration 0, loss = 0.0103
Iteration 20, loss = 0.0252
Iteration 40, loss = 0.0183
Iteration 60, loss = 0.0198
Iteration 80, loss = 0.0229
--- Epoch 891 / 100000
Iteration 0, loss = 0.0085
Iteration 20, loss = 0.0106
Iteration 40, loss = 0.0358
Iteration 60, loss = 0.0113
Iteration 80, loss = 0.0151
--- Epoch 892 / 100000
Iteration 0, loss = 0.0146
Iteration 20, loss = 0.0076
Iteration 40, loss = 0.0133
Iteration 60, loss = 0.0149
Iteration 80, loss = 0.0144
--- Epoch 893 / 100000
Iteration 0, loss = 0.0143
Iteration 20, loss = 0.0081
Iteration 40, loss = 0.0245
Iteration 60, loss = 0.0413
Iteration 80, loss = 0.0129
--- Epoch 894 / 100000
Iteration 0, loss = 0.0183
Iteration 20, loss = 0.0122
Iteration 40, loss = 0.0173
Iteration 60, loss = 0.0099
Iteration 80, loss = 0.0073
--- Epoch 895 / 100000
Iteration 0, loss = 0.0119
Iteration 20, loss = 0.0164
Iteration 40, loss = 0.0217
Iteration 60, loss = 0.0114
Iteration 80, loss = 0.0194
--- Epoch 896 / 100000
Iteration 0, loss = 0.0124
Iteration 20, loss = 0.0116
Iteration 40, loss = 0.0109
Iteration 60, loss = 0.0180
Iteration 80, loss = 0.0117
--- Epoch 897 / 100000
Iteration 0, loss = 0.0110
Iteration 20, loss = 0.0147
Iteration 40, loss = 0.0194
Iteration 60, loss = 0.0293
Iteration 80, loss = 0.0153
--- Epoch 898 / 100000
Iteration 0, loss = 0.0208
Iteration 20, loss = 0.0233
Iteration 40, loss = 0.0060
Iteration 60, loss = 0.0138
Iteration 80, loss = 0.0130
--- Epoch 899 / 100000
Iteration 0, loss = 0.0144
Iteration 20, loss = 0.0102
Iteration 40, loss = 0.0073
Iteration 60, loss = 0.0169
Iteration 80, loss = 0.0175
--- Epoch 900 / 100000
Iteration 0, loss = 0.0108
Iteration 20, loss = 0.0133
Iteration 40, loss = 0.0131
Iteration 60, loss = 0.0126
Iteration 80, loss = 0.0124
--- Epoch 901 / 100000
Iteration 0, loss = 0.0092
Iteration 20, loss = 0.0263
Iteration 40, loss = 0.0160
Iteration 60, loss = 0.0051
Iteration 80, loss = 0.0161
--- Epoch 902 / 100000
Iteration 0, loss = 0.0102
Iteration 20, loss = 0.0264
Iteration 40, loss = 0.0257
Iteration 60, loss = 0.0195
Iteration 80, loss = 0.0205
--- Epoch 903 / 100000
Iteration 0, loss = 0.0335
Iteration 20, loss = 0.0081
Iteration 40, loss = 0.0081
Iteration 60, loss = 0.0124
Iteration 80, loss = 0.0081
--- Epoch 904 / 100000
Iteration 0, loss = 0.0158
Iteration 20, loss = 0.0419
Iteration 40, loss = 0.0138
Iteration 60, loss = 0.0151
Iteration 80, loss = 0.0135
--- Epoch 905 / 100000
Iteration 0, loss = 0.0133
Iteration 20, loss = 0.0181
Iteration 40, loss = 0.0176
Iteration 60, loss = 0.0148
Iteration 80, loss = 0.0238
--- Epoch 906 / 100000
Iteration 0, loss = 0.0107
Iteration 20, loss = 0.0109
Iteration 40, loss = 0.0123
Iteration 60, loss = 0.0173
Iteration 80, loss = 0.0158
--- Epoch 907 / 100000
Iteration 0, loss = 0.0123
Iteration 20, loss = 0.0098
Iteration 40, loss = 0.0168
Iteration 60, loss = 0.0234
Iteration 80, loss = 0.0166
--- Epoch 908 / 100000
Iteration 0, loss = 0.0142
Iteration 20, loss = 0.0103
Iteration 40, loss = 0.0127
Iteration 60, loss = 0.0224
Iteration 80, loss = 0.0108
--- Epoch 909 / 100000
Iteration 0, loss = 0.0071
Iteration 20, loss = 0.0064
Iteration 40, loss = 0.0101
Iteration 60, loss = 0.0229
Iteration 80, loss = 0.0090
--- Epoch 910 / 100000
Iteration 0, loss = 0.0112
Iteration 20, loss = 0.0402
Iteration 40, loss = 0.0097
Iteration 60, loss = 0.0247
Iteration 80, loss = 0.0421
--- Epoch 911 / 100000
Iteration 0, loss = 0.0165
Iteration 20, loss = 0.0107
Iteration 40, loss = 0.0082
Iteration 60, loss = 0.0334
Iteration 80, loss = 0.0163
--- Epoch 912 / 100000
Iteration 0, loss = 0.0140
Iteration 20, loss = 0.0186
Iteration 40, loss = 0.0131
Iteration 60, loss = 0.0072
Iteration 80, loss = 0.0145
--- Epoch 913 / 100000
Iteration 0, loss = 0.0087
Iteration 20, loss = 0.0113
Iteration 40, loss = 0.0194
Iteration 60, loss = 0.0142
Iteration 80, loss = 0.0121
--- Epoch 914 / 100000
Iteration 0, loss = 0.0195
Iteration 20, loss = 0.0265
Iteration 40, loss = 0.0103
Iteration 60, loss = 0.0260
Iteration 80, loss = 0.0140
--- Epoch 915 / 100000
Iteration 0, loss = 0.0133
Iteration 20, loss = 0.0089
Iteration 40, loss = 0.0104
Iteration 60, loss = 0.0198
Iteration 80, loss = 0.0100
--- Epoch 916 / 100000
Iteration 0, loss = 0.0181
Iteration 20, loss = 0.0205
Iteration 40, loss = 0.0175
Iteration 60, loss = 0.0120
Iteration 80, loss = 0.0218
--- Epoch 917 / 100000
Iteration 0, loss = 0.0197
Iteration 20, loss = 0.0269
Iteration 40, loss = 0.0162
Iteration 60, loss = 0.0157
Iteration 80, loss = 0.0099
--- Epoch 918 / 100000
Iteration 0, loss = 0.0088
Iteration 20, loss = 0.0180
Iteration 40, loss = 0.0170
Iteration 60, loss = 0.0145
Iteration 80, loss = 0.0212
--- Epoch 919 / 100000
Iteration 0, loss = 0.0362
Iteration 20, loss = 0.0069
Iteration 40, loss = 0.0136
Iteration 60, loss = 0.0166
Iteration 80, loss = 0.0161
--- Epoch 920 / 100000
Iteration 0, loss = 0.0196
Iteration 20, loss = 0.0088
Iteration 40, loss = 0.0143
Iteration 60, loss = 0.0138
Iteration 80, loss = 0.0147
--- Epoch 921 / 100000
Iteration 0, loss = 0.0180
Iteration 20, loss = 0.0170
Iteration 40, loss = 0.0200
Iteration 60, loss = 0.0140
Iteration 80, loss = 0.0145
--- Epoch 922 / 100000
Iteration 0, loss = 0.0125
Iteration 20, loss = 0.0141
Iteration 40, loss = 0.0126
Iteration 60, loss = 0.0070
Iteration 80, loss = 0.0115
--- Epoch 923 / 100000
Iteration 0, loss = 0.0089
Iteration 20, loss = 0.0085
Iteration 40, loss = 0.0181
Iteration 60, loss = 0.0138
Iteration 80, loss = 0.0250
--- Epoch 924 / 100000
Iteration 0, loss = 0.0125
Iteration 20, loss = 0.0143
Iteration 40, loss = 0.0176
Iteration 60, loss = 0.0280
Iteration 80, loss = 0.0213
--- Epoch 925 / 100000
Iteration 0, loss = 0.0099
Iteration 20, loss = 0.0152
Iteration 40, loss = 0.0094
Iteration 60, loss = 0.0153
Iteration 80, loss = 0.0158
--- Epoch 926 / 100000
Iteration 0, loss = 0.0262
Iteration 20, loss = 0.0088
Iteration 40, loss = 0.0263
Iteration 60, loss = 0.0127
Iteration 80, loss = 0.0144
--- Epoch 927 / 100000
Iteration 0, loss = 0.0223
Iteration 20, loss = 0.0088
Iteration 40, loss = 0.0092
Iteration 60, loss = 0.0166
Iteration 80, loss = 0.0198
--- Epoch 928 / 100000
Iteration 0, loss = 0.0144
Iteration 20, loss = 0.0158
Iteration 40, loss = 0.0138
Iteration 60, loss = 0.0193
Iteration 80, loss = 0.0099
--- Epoch 929 / 100000
Iteration 0, loss = 0.0155
Iteration 20, loss = 0.0105
Iteration 40, loss = 0.0099
Iteration 60, loss = 0.0081
Iteration 80, loss = 0.0084
--- Epoch 930 / 100000
Iteration 0, loss = 0.0153
Iteration 20, loss = 0.0164
Iteration 40, loss = 0.0125
Iteration 60, loss = 0.0208
Iteration 80, loss = 0.0233
--- Epoch 931 / 100000
Iteration 0, loss = 0.0091
Iteration 20, loss = 0.0177
Iteration 40, loss = 0.0128
Iteration 60, loss = 0.0125
Iteration 80, loss = 0.0157
--- Epoch 932 / 100000
Iteration 0, loss = 0.0080
Iteration 20, loss = 0.0101
Iteration 40, loss = 0.0300
Iteration 60, loss = 0.0086
Iteration 80, loss = 0.0153
--- Epoch 933 / 100000
Iteration 0, loss = 0.0146
Iteration 20, loss = 0.0147
Iteration 40, loss = 0.0150
Iteration 60, loss = 0.0065
Iteration 80, loss = 0.0110
--- Epoch 934 / 100000
Iteration 0, loss = 0.0074
Iteration 20, loss = 0.0132
Iteration 40, loss = 0.0134
Iteration 60, loss = 0.0140
Iteration 80, loss = 0.0197
--- Epoch 935 / 100000
Iteration 0, loss = 0.0292
Iteration 20, loss = 0.0097
Iteration 40, loss = 0.0232
Iteration 60, loss = 0.0077
Iteration 80, loss = 0.0126
--- Epoch 936 / 100000
Iteration 0, loss = 0.0159
Iteration 20, loss = 0.0120
Iteration 40, loss = 0.0133
Iteration 60, loss = 0.0162
Iteration 80, loss = 0.0283
--- Epoch 937 / 100000
Iteration 0, loss = 0.0139
Iteration 20, loss = 0.0278
Iteration 40, loss = 0.0303
Iteration 60, loss = 0.0091
Iteration 80, loss = 0.0660
--- Epoch 938 / 100000
Iteration 0, loss = 0.0114
Iteration 20, loss = 0.0283
Iteration 40, loss = 0.0190
Iteration 60, loss = 0.0111
Iteration 80, loss = 0.0137
--- Epoch 939 / 100000
Iteration 0, loss = 0.0104
Iteration 20, loss = 0.0226
Iteration 40, loss = 0.0188
Iteration 60, loss = 0.0123
Iteration 80, loss = 0.0085
--- Epoch 940 / 100000
Iteration 0, loss = 0.0143
Iteration 20, loss = 0.0127
Iteration 40, loss = 0.0143
Iteration 60, loss = 0.0128
Iteration 80, loss = 0.0076
--- Epoch 941 / 100000
Iteration 0, loss = 0.0132
Iteration 20, loss = 0.0159
Iteration 40, loss = 0.0092
Iteration 60, loss = 0.0100
Iteration 80, loss = 0.0078
--- Epoch 942 / 100000
Iteration 0, loss = 0.0137
Iteration 20, loss = 0.0098
Iteration 40, loss = 0.0074
Iteration 60, loss = 0.0170
Iteration 80, loss = 0.0198
--- Epoch 943 / 100000
Iteration 0, loss = 0.0105
Iteration 20, loss = 0.0123
Iteration 40, loss = 0.0118
Iteration 60, loss = 0.0087
Iteration 80, loss = 0.0077
--- Epoch 944 / 100000
Iteration 0, loss = 0.0161
Iteration 20, loss = 0.0422
Iteration 40, loss = 0.0175
Iteration 60, loss = 0.0147
Iteration 80, loss = 0.0143
--- Epoch 945 / 100000
Iteration 0, loss = 0.0415
Iteration 20, loss = 0.0115
Iteration 40, loss = 0.0109
Iteration 60, loss = 0.0119
Iteration 80, loss = 0.0177
--- Epoch 946 / 100000
Iteration 0, loss = 0.0111
Iteration 20, loss = 0.0135
Iteration 40, loss = 0.0120
Iteration 60, loss = 0.0109
Iteration 80, loss = 0.0230
--- Epoch 947 / 100000
Iteration 0, loss = 0.0096
Iteration 20, loss = 0.0247
Iteration 40, loss = 0.0107
Iteration 60, loss = 0.0134
Iteration 80, loss = 0.0403
--- Epoch 948 / 100000
Iteration 0, loss = 0.0137
Iteration 20, loss = 0.0112
Iteration 40, loss = 0.0249
Iteration 60, loss = 0.0099
Iteration 80, loss = 0.0174
--- Epoch 949 / 100000
Iteration 0, loss = 0.0152
Iteration 20, loss = 0.0171
Iteration 40, loss = 0.0250
Iteration 60, loss = 0.0117
Iteration 80, loss = 0.0089
--- Epoch 950 / 100000
Iteration 0, loss = 0.0133
Iteration 20, loss = 0.0143
Iteration 40, loss = 0.0147
Iteration 60, loss = 0.0164
Iteration 80, loss = 0.0238
--- Epoch 951 / 100000
Iteration 0, loss = 0.0102
Iteration 20, loss = 0.0101
Iteration 40, loss = 0.0286
Iteration 60, loss = 0.0100
Iteration 80, loss = 0.0183
--- Epoch 952 / 100000
Iteration 0, loss = 0.0213
Iteration 20, loss = 0.0128
Iteration 40, loss = 0.0247
Iteration 60, loss = 0.0156
Iteration 80, loss = 0.0083
--- Epoch 953 / 100000
Iteration 0, loss = 0.0242
Iteration 20, loss = 0.0154
Iteration 40, loss = 0.0103
Iteration 60, loss = 0.0196
Iteration 80, loss = 0.0103
--- Epoch 954 / 100000
Iteration 0, loss = 0.0108
Iteration 20, loss = 0.0071
Iteration 40, loss = 0.0088
Iteration 60, loss = 0.0140
Iteration 80, loss = 0.0077
--- Epoch 955 / 100000
Iteration 0, loss = 0.0294
Iteration 20, loss = 0.0090
Iteration 40, loss = 0.0063
Iteration 60, loss = 0.0094
Iteration 80, loss = 0.0141
--- Epoch 956 / 100000
Iteration 0, loss = 0.0093
Iteration 20, loss = 0.0122
Iteration 40, loss = 0.0145
Iteration 60, loss = 0.0163
Iteration 80, loss = 0.0132
--- Epoch 957 / 100000
Iteration 0, loss = 0.0208
Iteration 20, loss = 0.0384
Iteration 40, loss = 0.0242
Iteration 60, loss = 0.0127
Iteration 80, loss = 0.0097
--- Epoch 958 / 100000
Iteration 0, loss = 0.0089
Iteration 20, loss = 0.0135
Iteration 40, loss = 0.0203
Iteration 60, loss = 0.0133
Iteration 80, loss = 0.0075
--- Epoch 959 / 100000
Iteration 0, loss = 0.0147
Iteration 20, loss = 0.0140
Iteration 40, loss = 0.0120
Iteration 60, loss = 0.0080
Iteration 80, loss = 0.0115
--- Epoch 960 / 100000
Iteration 0, loss = 0.0123
Iteration 20, loss = 0.0103
Iteration 40, loss = 0.0211
Iteration 60, loss = 0.0136
Iteration 80, loss = 0.0279
--- Epoch 961 / 100000
Iteration 0, loss = 0.0350
Iteration 20, loss = 0.0093
Iteration 40, loss = 0.0237
Iteration 60, loss = 0.0119
Iteration 80, loss = 0.0109
--- Epoch 962 / 100000
Iteration 0, loss = 0.0180
Iteration 20, loss = 0.0134
Iteration 40, loss = 0.0107
Iteration 60, loss = 0.0156
Iteration 80, loss = 0.0150
--- Epoch 963 / 100000
Iteration 0, loss = 0.0170
Iteration 20, loss = 0.0087
Iteration 40, loss = 0.0130
Iteration 60, loss = 0.0094
Iteration 80, loss = 0.0126
--- Epoch 964 / 100000
Iteration 0, loss = 0.0210
Iteration 20, loss = 0.0078
Iteration 40, loss = 0.0171
Iteration 60, loss = 0.0147
Iteration 80, loss = 0.0091
--- Epoch 965 / 100000
Iteration 0, loss = 0.0115
Iteration 20, loss = 0.0267
Iteration 40, loss = 0.0103
Iteration 60, loss = 0.0139
Iteration 80, loss = 0.0209
--- Epoch 966 / 100000
Iteration 0, loss = 0.0124
Iteration 20, loss = 0.0107
Iteration 40, loss = 0.0132
Iteration 60, loss = 0.0161
Iteration 80, loss = 0.0216
--- Epoch 967 / 100000
Iteration 0, loss = 0.0113
Iteration 20, loss = 0.0121
Iteration 40, loss = 0.0213
Iteration 60, loss = 0.0129
Iteration 80, loss = 0.0173
--- Epoch 968 / 100000
Iteration 0, loss = 0.0134
Iteration 20, loss = 0.0126
Iteration 40, loss = 0.0091
Iteration 60, loss = 0.0151
Iteration 80, loss = 0.0228
--- Epoch 969 / 100000
Iteration 0, loss = 0.0104
Iteration 20, loss = 0.0118
Iteration 40, loss = 0.0102
Iteration 60, loss = 0.0103
Iteration 80, loss = 0.0672
--- Epoch 970 / 100000
Iteration 0, loss = 0.0139
Iteration 20, loss = 0.0114
Iteration 40, loss = 0.0102
Iteration 60, loss = 0.0237
Iteration 80, loss = 0.0243
--- Epoch 971 / 100000
Iteration 0, loss = 0.0116
Iteration 20, loss = 0.0191
Iteration 40, loss = 0.0133
Iteration 60, loss = 0.0177
Iteration 80, loss = 0.0167
--- Epoch 972 / 100000
Iteration 0, loss = 0.0185
Iteration 20, loss = 0.0095
Iteration 40, loss = 0.0276
Iteration 60, loss = 0.0388
Iteration 80, loss = 0.0113
--- Epoch 973 / 100000
Iteration 0, loss = 0.0128
Iteration 20, loss = 0.0218
Iteration 40, loss = 0.0097
Iteration 60, loss = 0.0142
Iteration 80, loss = 0.0136
--- Epoch 974 / 100000
Iteration 0, loss = 0.0090
Iteration 20, loss = 0.0080
Iteration 40, loss = 0.0109
Iteration 60, loss = 0.0124
Iteration 80, loss = 0.0148
--- Epoch 975 / 100000
Iteration 0, loss = 0.0219
Iteration 20, loss = 0.0165
Iteration 40, loss = 0.0095
Iteration 60, loss = 0.0150
Iteration 80, loss = 0.0195
--- Epoch 976 / 100000
Iteration 0, loss = 0.0121
Iteration 20, loss = 0.0122
Iteration 40, loss = 0.0113
Iteration 60, loss = 0.0113
Iteration 80, loss = 0.0107
--- Epoch 977 / 100000
Iteration 0, loss = 0.0106
Iteration 20, loss = 0.0092
Iteration 40, loss = 0.0095
Iteration 60, loss = 0.0177
Iteration 80, loss = 0.0099
--- Epoch 978 / 100000
Iteration 0, loss = 0.0159
Iteration 20, loss = 0.0172
Iteration 40, loss = 0.0138
Iteration 60, loss = 0.0110
Iteration 80, loss = 0.0119
--- Epoch 979 / 100000
Iteration 0, loss = 0.0145
Iteration 20, loss = 0.0084
Iteration 40, loss = 0.0103
Iteration 60, loss = 0.0133
Iteration 80, loss = 0.0256
--- Epoch 980 / 100000
Iteration 0, loss = 0.0104
Iteration 20, loss = 0.0110
Iteration 40, loss = 0.0109
Iteration 60, loss = 0.0074
Iteration 80, loss = 0.0164
--- Epoch 981 / 100000
Iteration 0, loss = 0.0133
Iteration 20, loss = 0.0107
Iteration 40, loss = 0.0118
Iteration 60, loss = 0.0097
Iteration 80, loss = 0.0175
--- Epoch 982 / 100000
Iteration 0, loss = 0.0184
Iteration 20, loss = 0.0226
Iteration 40, loss = 0.0133
Iteration 60, loss = 0.0193
Iteration 80, loss = 0.0114
--- Epoch 983 / 100000
Iteration 0, loss = 0.0182
Iteration 20, loss = 0.0099
Iteration 40, loss = 0.0123
Iteration 60, loss = 0.0111
Iteration 80, loss = 0.0112
--- Epoch 984 / 100000
Iteration 0, loss = 0.0143
Iteration 20, loss = 0.0242
Iteration 40, loss = 0.0183
Iteration 60, loss = 0.0204
Iteration 80, loss = 0.0129
--- Epoch 985 / 100000
Iteration 0, loss = 0.0144
Iteration 20, loss = 0.0126
Iteration 40, loss = 0.0231
Iteration 60, loss = 0.0131
Iteration 80, loss = 0.0095
--- Epoch 986 / 100000
Iteration 0, loss = 0.0265
Iteration 20, loss = 0.0164
Iteration 40, loss = 0.0102
Iteration 60, loss = 0.0147
Iteration 80, loss = 0.0257
--- Epoch 987 / 100000
Iteration 0, loss = 0.0120
Iteration 20, loss = 0.0116
Iteration 40, loss = 0.0175
Iteration 60, loss = 0.0184
Iteration 80, loss = 0.0204
--- Epoch 988 / 100000
Iteration 0, loss = 0.0160
Iteration 20, loss = 0.0065
Iteration 40, loss = 0.0157
Iteration 60, loss = 0.0279
Iteration 80, loss = 0.0277
--- Epoch 989 / 100000
Iteration 0, loss = 0.0166
Iteration 20, loss = 0.0149
Iteration 40, loss = 0.0141
Iteration 60, loss = 0.0082
Iteration 80, loss = 0.0077
--- Epoch 990 / 100000
Iteration 0, loss = 0.0092
Iteration 20, loss = 0.0169
Iteration 40, loss = 0.0243
Iteration 60, loss = 0.0243
Iteration 80, loss = 0.0210
--- Epoch 991 / 100000
Iteration 0, loss = 0.0132
Iteration 20, loss = 0.0127
Iteration 40, loss = 0.0096
Iteration 60, loss = 0.0160
Iteration 80, loss = 0.0097
--- Epoch 992 / 100000
Iteration 0, loss = 0.0101
Iteration 20, loss = 0.0232
Iteration 40, loss = 0.0185
Iteration 60, loss = 0.0208
Iteration 80, loss = 0.0174
--- Epoch 993 / 100000
Iteration 0, loss = 0.0077
Iteration 20, loss = 0.0191
Iteration 40, loss = 0.0109
Iteration 60, loss = 0.0286
Iteration 80, loss = 0.0142
--- Epoch 994 / 100000
Iteration 0, loss = 0.0094
Iteration 20, loss = 0.0231
Iteration 40, loss = 0.0077
Iteration 60, loss = 0.0171
Iteration 80, loss = 0.0198
--- Epoch 995 / 100000
Iteration 0, loss = 0.0230
Iteration 20, loss = 0.0093
Iteration 40, loss = 0.0094
Iteration 60, loss = 0.0071
Iteration 80, loss = 0.0106
--- Epoch 996 / 100000
Iteration 0, loss = 0.0186
Iteration 20, loss = 0.0146
Iteration 40, loss = 0.0227
Iteration 60, loss = 0.0178
Iteration 80, loss = 0.0102
--- Epoch 997 / 100000
Iteration 0, loss = 0.0124
Iteration 20, loss = 0.0217
Iteration 40, loss = 0.0205
Iteration 60, loss = 0.0132
Iteration 80, loss = 0.0166
--- Epoch 998 / 100000
Iteration 0, loss = 0.0105
Iteration 20, loss = 0.0171
Iteration 40, loss = 0.0124
Iteration 60, loss = 0.0128
Iteration 80, loss = 0.0206
--- Epoch 999 / 100000
Iteration 0, loss = 0.0311
Iteration 20, loss = 0.0152
Iteration 40, loss = 0.0098
Iteration 60, loss = 0.0186
Iteration 80, loss = 0.0155
--- Epoch 1000 / 100000
Iteration 0, loss = 0.0099
Iteration 20, loss = 0.0177
Iteration 40, loss = 0.0290
Iteration 60, loss = 0.0103
Iteration 80, loss = 0.0192
--- Epoch 1001 / 100000
Iteration 0, loss = 0.0148
Iteration 20, loss = 0.0094
Iteration 40, loss = 0.0215
Iteration 60, loss = 0.0121
Iteration 80, loss = 0.0172
--- Epoch 1002 / 100000
Iteration 0, loss = 0.0120
Iteration 20, loss = 0.0095
Iteration 40, loss = 0.0356
Iteration 60, loss = 0.0122
Iteration 80, loss = 0.0185
--- Epoch 1003 / 100000
Iteration 0, loss = 0.0089
Iteration 20, loss = 0.0122
Iteration 40, loss = 0.0342
Iteration 60, loss = 0.0367
Iteration 80, loss = 0.0111
--- Epoch 1004 / 100000
Iteration 0, loss = 0.0155
Iteration 20, loss = 0.0253
Iteration 40, loss = 0.0145
Iteration 60, loss = 0.0256
Iteration 80, loss = 0.0208
--- Epoch 1005 / 100000
Iteration 0, loss = 0.0097
Iteration 20, loss = 0.0103
Iteration 40, loss = 0.0170
Iteration 60, loss = 0.0107
Iteration 80, loss = 0.0220
--- Epoch 1006 / 100000
Iteration 0, loss = 0.0224
Iteration 20, loss = 0.0180
Iteration 40, loss = 0.0104
Iteration 60, loss = 0.0071
Iteration 80, loss = 0.0177
--- Epoch 1007 / 100000
Iteration 0, loss = 0.0171
Iteration 20, loss = 0.0123
Iteration 40, loss = 0.0096
Iteration 60, loss = 0.0206
Iteration 80, loss = 0.0148
--- Epoch 1008 / 100000
Iteration 0, loss = 0.0127
Iteration 20, loss = 0.0110
Iteration 40, loss = 0.0111
Iteration 60, loss = 0.0141
Iteration 80, loss = 0.0058
--- Epoch 1009 / 100000
Iteration 0, loss = 0.0196
Iteration 20, loss = 0.0119
Iteration 40, loss = 0.0144
Iteration 60, loss = 0.0118
Iteration 80, loss = 0.0138
--- Epoch 1010 / 100000
Iteration 0, loss = 0.0145
Iteration 20, loss = 0.0133
Iteration 40, loss = 0.0098
Iteration 60, loss = 0.0137
Iteration 80, loss = 0.0056
--- Epoch 1011 / 100000
Iteration 0, loss = 0.0113
Iteration 20, loss = 0.0140
Iteration 40, loss = 0.0077
Iteration 60, loss = 0.0159
Iteration 80, loss = 0.0167
--- Epoch 1012 / 100000
Iteration 0, loss = 0.0100
Iteration 20, loss = 0.0084
Iteration 40, loss = 0.0125
Iteration 60, loss = 0.0139
Iteration 80, loss = 0.0103
--- Epoch 1013 / 100000
Iteration 0, loss = 0.0095
Iteration 20, loss = 0.0120
Iteration 40, loss = 0.0230
Iteration 60, loss = 0.0122
Iteration 80, loss = 0.0103
--- Epoch 1014 / 100000
Iteration 0, loss = 0.0107
Iteration 20, loss = 0.0092
Iteration 40, loss = 0.0143
Iteration 60, loss = 0.0399
Iteration 80, loss = 0.0091
--- Epoch 1015 / 100000
Iteration 0, loss = 0.0262
Iteration 20, loss = 0.0097
Iteration 40, loss = 0.0079
Iteration 60, loss = 0.0065
Iteration 80, loss = 0.0091
--- Epoch 1016 / 100000
Iteration 0, loss = 0.0257
Iteration 20, loss = 0.0113
Iteration 40, loss = 0.0118
Iteration 60, loss = 0.0116
Iteration 80, loss = 0.0173
--- Epoch 1017 / 100000
Iteration 0, loss = 0.0145
Iteration 20, loss = 0.0078
Iteration 40, loss = 0.0116
Iteration 60, loss = 0.0108
Iteration 80, loss = 0.0136
--- Epoch 1018 / 100000
Iteration 0, loss = 0.0158
Iteration 20, loss = 0.0113
Iteration 40, loss = 0.0171
Iteration 60, loss = 0.0122
Iteration 80, loss = 0.0118
--- Epoch 1019 / 100000
Iteration 0, loss = 0.0180
Iteration 20, loss = 0.0173
Iteration 40, loss = 0.0298
Iteration 60, loss = 0.0209
Iteration 80, loss = 0.0133
--- Epoch 1020 / 100000
Iteration 0, loss = 0.0194
Iteration 20, loss = 0.0114
Iteration 40, loss = 0.0091
Iteration 60, loss = 0.0119
Iteration 80, loss = 0.0114
--- Epoch 1021 / 100000
Iteration 0, loss = 0.0121
Iteration 20, loss = 0.0087
Iteration 40, loss = 0.0177
Iteration 60, loss = 0.0090
Iteration 80, loss = 0.0302
--- Epoch 1022 / 100000
Iteration 0, loss = 0.0238
Iteration 20, loss = 0.0243
Iteration 40, loss = 0.0142
Iteration 60, loss = 0.0144
Iteration 80, loss = 0.0154
--- Epoch 1023 / 100000
Iteration 0, loss = 0.0110
Iteration 20, loss = 0.0189
Iteration 40, loss = 0.0175
Iteration 60, loss = 0.0186
Iteration 80, loss = 0.0112
--- Epoch 1024 / 100000
Iteration 0, loss = 0.0115
Iteration 20, loss = 0.0270
Iteration 40, loss = 0.0077
Iteration 60, loss = 0.0107
Iteration 80, loss = 0.0144
--- Epoch 1025 / 100000
Iteration 0, loss = 0.0091
Iteration 20, loss = 0.0150
Iteration 40, loss = 0.0139
Iteration 60, loss = 0.0119
Iteration 80, loss = 0.0222
--- Epoch 1026 / 100000
Iteration 0, loss = 0.0126
Iteration 20, loss = 0.0229
Iteration 40, loss = 0.0193
Iteration 60, loss = 0.0090
Iteration 80, loss = 0.0092
--- Epoch 1027 / 100000
Iteration 0, loss = 0.0112
Iteration 20, loss = 0.0109
Iteration 40, loss = 0.0096
Iteration 60, loss = 0.0103
Iteration 80, loss = 0.0121
--- Epoch 1028 / 100000
Iteration 0, loss = 0.0096
Iteration 20, loss = 0.0201
Iteration 40, loss = 0.0107
Iteration 60, loss = 0.0090
Iteration 80, loss = 0.0234
--- Epoch 1029 / 100000
Iteration 0, loss = 0.0183
Iteration 20, loss = 0.0203
Iteration 40, loss = 0.0108
Iteration 60, loss = 0.0140
Iteration 80, loss = 0.0185
--- Epoch 1030 / 100000
Iteration 0, loss = 0.0133
Iteration 20, loss = 0.0123
Iteration 40, loss = 0.0087
Iteration 60, loss = 0.0190
Iteration 80, loss = 0.0142
--- Epoch 1031 / 100000
Iteration 0, loss = 0.0112
Iteration 20, loss = 0.0138
Iteration 40, loss = 0.0155
Iteration 60, loss = 0.0066
Iteration 80, loss = 0.0092
--- Epoch 1032 / 100000
Iteration 0, loss = 0.0616
Iteration 20, loss = 0.0219
Iteration 40, loss = 0.0130
Iteration 60, loss = 0.0083
Iteration 80, loss = 0.0156
--- Epoch 1033 / 100000
Iteration 0, loss = 0.0102
Iteration 20, loss = 0.0169
Iteration 40, loss = 0.0090
Iteration 60, loss = 0.0248
Iteration 80, loss = 0.0202
--- Epoch 1034 / 100000
Iteration 0, loss = 0.0106
Iteration 20, loss = 0.0102
Iteration 40, loss = 0.0108
Iteration 60, loss = 0.0122
Iteration 80, loss = 0.0151
--- Epoch 1035 / 100000
Iteration 0, loss = 0.0128
Iteration 20, loss = 0.0145
Iteration 40, loss = 0.0128
Iteration 60, loss = 0.0065
Iteration 80, loss = 0.0163
--- Epoch 1036 / 100000
Iteration 0, loss = 0.0128
Iteration 20, loss = 0.0092
Iteration 40, loss = 0.0370
Iteration 60, loss = 0.0070
Iteration 80, loss = 0.0110
--- Epoch 1037 / 100000
Iteration 0, loss = 0.0128
Iteration 20, loss = 0.0138
Iteration 40, loss = 0.0099
Iteration 60, loss = 0.0088
Iteration 80, loss = 0.0193
--- Epoch 1038 / 100000
Iteration 0, loss = 0.0126
Iteration 20, loss = 0.0339
Iteration 40, loss = 0.0095
Iteration 60, loss = 0.0082
Iteration 80, loss = 0.0065
--- Epoch 1039 / 100000
Iteration 0, loss = 0.0090
Iteration 20, loss = 0.0096
Iteration 40, loss = 0.0106
Iteration 60, loss = 0.0094
Iteration 80, loss = 0.0150
--- Epoch 1040 / 100000
Iteration 0, loss = 0.0116
Iteration 20, loss = 0.0111
Iteration 40, loss = 0.0486
Iteration 60, loss = 0.0155
Iteration 80, loss = 0.0131
--- Epoch 1041 / 100000
Iteration 0, loss = 0.0223
Iteration 20, loss = 0.0088
Iteration 40, loss = 0.0115
Iteration 60, loss = 0.0176
Iteration 80, loss = 0.0164
--- Epoch 1042 / 100000
Iteration 0, loss = 0.0159
Iteration 20, loss = 0.0099
Iteration 40, loss = 0.0363
Iteration 60, loss = 0.0240
Iteration 80, loss = 0.0136
--- Epoch 1043 / 100000
Iteration 0, loss = 0.0223
Iteration 20, loss = 0.0195
Iteration 40, loss = 0.0108
Iteration 60, loss = 0.0088
Iteration 80, loss = 0.0095
--- Epoch 1044 / 100000
Iteration 0, loss = 0.0170
Iteration 20, loss = 0.0146
Iteration 40, loss = 0.0293
Iteration 60, loss = 0.0140
Iteration 80, loss = 0.0157
--- Epoch 1045 / 100000
Iteration 0, loss = 0.0148
Iteration 20, loss = 0.0192
Iteration 40, loss = 0.0106
Iteration 60, loss = 0.0153
Iteration 80, loss = 0.0251
--- Epoch 1046 / 100000
Iteration 0, loss = 0.0356
Iteration 20, loss = 0.0233
Iteration 40, loss = 0.0134
Iteration 60, loss = 0.0160
Iteration 80, loss = 0.0074
--- Epoch 1047 / 100000
Iteration 0, loss = 0.0251
Iteration 20, loss = 0.0139
Iteration 40, loss = 0.0140
Iteration 60, loss = 0.0217
Iteration 80, loss = 0.0072
--- Epoch 1048 / 100000
Iteration 0, loss = 0.0132
Iteration 20, loss = 0.0067
Iteration 40, loss = 0.0130
Iteration 60, loss = 0.0149
Iteration 80, loss = 0.0172
--- Epoch 1049 / 100000
Iteration 0, loss = 0.0122
Iteration 20, loss = 0.0119
Iteration 40, loss = 0.0111
Iteration 60, loss = 0.0089
Iteration 80, loss = 0.0128
--- Epoch 1050 / 100000
Iteration 0, loss = 0.0101
Iteration 20, loss = 0.0145
Iteration 40, loss = 0.0258
Iteration 60, loss = 0.0447
Iteration 80, loss = 0.0154
--- Epoch 1051 / 100000
Iteration 0, loss = 0.0173
Iteration 20, loss = 0.0098
Iteration 40, loss = 0.0113
Iteration 60, loss = 0.0126
Iteration 80, loss = 0.0176
--- Epoch 1052 / 100000
Iteration 0, loss = 0.0117
Iteration 20, loss = 0.0125
Iteration 40, loss = 0.0158
Iteration 60, loss = 0.0193
Iteration 80, loss = 0.0452
--- Epoch 1053 / 100000
Iteration 0, loss = 0.0119
Iteration 20, loss = 0.0107
Iteration 40, loss = 0.0213
Iteration 60, loss = 0.0350
Iteration 80, loss = 0.0130
--- Epoch 1054 / 100000
Iteration 0, loss = 0.0121
Iteration 20, loss = 0.0139
Iteration 40, loss = 0.0113
Iteration 60, loss = 0.0109
Iteration 80, loss = 0.0227
--- Epoch 1055 / 100000
Iteration 0, loss = 0.0143
Iteration 20, loss = 0.0110
Iteration 40, loss = 0.0084
Iteration 60, loss = 0.0108
Iteration 80, loss = 0.0111
--- Epoch 1056 / 100000
Iteration 0, loss = 0.0124
Iteration 20, loss = 0.0069
Iteration 40, loss = 0.0254
Iteration 60, loss = 0.0164
Iteration 80, loss = 0.0139
--- Epoch 1057 / 100000
Iteration 0, loss = 0.0132
Iteration 20, loss = 0.0189
Iteration 40, loss = 0.0152
Iteration 60, loss = 0.0159
Iteration 80, loss = 0.0146
--- Epoch 1058 / 100000
Iteration 0, loss = 0.0163
Iteration 20, loss = 0.0110
Iteration 40, loss = 0.0123
Iteration 60, loss = 0.0249
Iteration 80, loss = 0.0176
--- Epoch 1059 / 100000
Iteration 0, loss = 0.0183
Iteration 20, loss = 0.0172
Iteration 40, loss = 0.0119
Iteration 60, loss = 0.0061
Iteration 80, loss = 0.0111
--- Epoch 1060 / 100000
Iteration 0, loss = 0.0121
Iteration 20, loss = 0.0155
Iteration 40, loss = 0.0150
Iteration 60, loss = 0.0172
Iteration 80, loss = 0.0152
--- Epoch 1061 / 100000
Iteration 0, loss = 0.0088
Iteration 20, loss = 0.0132
Iteration 40, loss = 0.0358
Iteration 60, loss = 0.0099
Iteration 80, loss = 0.0160
--- Epoch 1062 / 100000
Iteration 0, loss = 0.0118
Iteration 20, loss = 0.0175
Iteration 40, loss = 0.0189
Iteration 60, loss = 0.0080
Iteration 80, loss = 0.0175
--- Epoch 1063 / 100000
Iteration 0, loss = 0.0096
Iteration 20, loss = 0.0074
Iteration 40, loss = 0.0104
Iteration 60, loss = 0.0325
Iteration 80, loss = 0.0151
--- Epoch 1064 / 100000
Iteration 0, loss = 0.0110
Iteration 20, loss = 0.0088
Iteration 40, loss = 0.0127
Iteration 60, loss = 0.0100
Iteration 80, loss = 0.0092
--- Epoch 1065 / 100000
Iteration 0, loss = 0.0129
Iteration 20, loss = 0.0364
Iteration 40, loss = 0.0164
Iteration 60, loss = 0.0320
Iteration 80, loss = 0.0161
--- Epoch 1066 / 100000
Iteration 0, loss = 0.0109
Iteration 20, loss = 0.0115
Iteration 40, loss = 0.0109
Iteration 60, loss = 0.0145
Iteration 80, loss = 0.0118
--- Epoch 1067 / 100000
Iteration 0, loss = 0.0137
Iteration 20, loss = 0.0083
Iteration 40, loss = 0.0282
Iteration 60, loss = 0.0182
Iteration 80, loss = 0.0304
--- Epoch 1068 / 100000
Iteration 0, loss = 0.0222
Iteration 20, loss = 0.0067
Iteration 40, loss = 0.0096
Iteration 60, loss = 0.0069
Iteration 80, loss = 0.0125
--- Epoch 1069 / 100000
Iteration 0, loss = 0.0134
Iteration 20, loss = 0.0104
Iteration 40, loss = 0.0099
Iteration 60, loss = 0.0118
Iteration 80, loss = 0.0111
--- Epoch 1070 / 100000
Iteration 0, loss = 0.0105
Iteration 20, loss = 0.0124
Iteration 40, loss = 0.0147
Iteration 60, loss = 0.0130
Iteration 80, loss = 0.0109
--- Epoch 1071 / 100000
Iteration 0, loss = 0.0092
Iteration 20, loss = 0.0243
Iteration 40, loss = 0.0195
Iteration 60, loss = 0.0117
Iteration 80, loss = 0.0114
--- Epoch 1072 / 100000
Iteration 0, loss = 0.0212
Iteration 20, loss = 0.0195
Iteration 40, loss = 0.0289
Iteration 60, loss = 0.0142
Iteration 80, loss = 0.0092
--- Epoch 1073 / 100000
Iteration 0, loss = 0.0333
Iteration 20, loss = 0.0151
Iteration 40, loss = 0.0102
Iteration 60, loss = 0.0087
Iteration 80, loss = 0.0087
--- Epoch 1074 / 100000
Iteration 0, loss = 0.0191
Iteration 20, loss = 0.0132
Iteration 40, loss = 0.0118
Iteration 60, loss = 0.0273
Iteration 80, loss = 0.0116
--- Epoch 1075 / 100000
Iteration 0, loss = 0.0105
Iteration 20, loss = 0.0084
Iteration 40, loss = 0.0100
Iteration 60, loss = 0.0109
Iteration 80, loss = 0.0135
--- Epoch 1076 / 100000
Iteration 0, loss = 0.0130
Iteration 20, loss = 0.0070
Iteration 40, loss = 0.0143
Iteration 60, loss = 0.0118
Iteration 80, loss = 0.0117
--- Epoch 1077 / 100000
Iteration 0, loss = 0.0142
Iteration 20, loss = 0.0115
Iteration 40, loss = 0.0162
Iteration 60, loss = 0.0093
Iteration 80, loss = 0.0171
--- Epoch 1078 / 100000
Iteration 0, loss = 0.0064
Iteration 20, loss = 0.0108
Iteration 40, loss = 0.0240
Iteration 60, loss = 0.0112
Iteration 80, loss = 0.0177
--- Epoch 1079 / 100000
Iteration 0, loss = 0.0229
Iteration 20, loss = 0.0118
Iteration 40, loss = 0.0134
Iteration 60, loss = 0.0176
Iteration 80, loss = 0.0114
--- Epoch 1080 / 100000
Iteration 0, loss = 0.0122
Iteration 20, loss = 0.0138
Iteration 40, loss = 0.0101
Iteration 60, loss = 0.0118
Iteration 80, loss = 0.0186
--- Epoch 1081 / 100000
Iteration 0, loss = 0.0178
Iteration 20, loss = 0.0237
Iteration 40, loss = 0.0117
Iteration 60, loss = 0.0092
Iteration 80, loss = 0.0126
--- Epoch 1082 / 100000
Iteration 0, loss = 0.0115
Iteration 20, loss = 0.0116
Iteration 40, loss = 0.0095
Iteration 60, loss = 0.0138
Iteration 80, loss = 0.0148
--- Epoch 1083 / 100000
Iteration 0, loss = 0.0104
Iteration 20, loss = 0.0125
Iteration 40, loss = 0.0107
Iteration 60, loss = 0.0113
Iteration 80, loss = 0.0082
--- Epoch 1084 / 100000
Iteration 0, loss = 0.0150
Iteration 20, loss = 0.0103
Iteration 40, loss = 0.0132
Iteration 60, loss = 0.0112
Iteration 80, loss = 0.0078
--- Epoch 1085 / 100000
Iteration 0, loss = 0.0081
Iteration 20, loss = 0.0148
Iteration 40, loss = 0.0074
Iteration 60, loss = 0.0130
Iteration 80, loss = 0.0175
--- Epoch 1086 / 100000
Iteration 0, loss = 0.0121
Iteration 20, loss = 0.0103
Iteration 40, loss = 0.0116
Iteration 60, loss = 0.0156
Iteration 80, loss = 0.0126
--- Epoch 1087 / 100000
Iteration 0, loss = 0.0142
Iteration 20, loss = 0.0148
Iteration 40, loss = 0.0201
Iteration 60, loss = 0.0123
Iteration 80, loss = 0.0108
--- Epoch 1088 / 100000
Iteration 0, loss = 0.0117
Iteration 20, loss = 0.0205
Iteration 40, loss = 0.0142
Iteration 60, loss = 0.0145
Iteration 80, loss = 0.0131
--- Epoch 1089 / 100000
Iteration 0, loss = 0.0077
Iteration 20, loss = 0.0166
Iteration 40, loss = 0.0069
Iteration 60, loss = 0.0094
Iteration 80, loss = 0.0069
--- Epoch 1090 / 100000
Iteration 0, loss = 0.0110
Iteration 20, loss = 0.0119
Iteration 40, loss = 0.0093
Iteration 60, loss = 0.0114
Iteration 80, loss = 0.0094
--- Epoch 1091 / 100000
Iteration 0, loss = 0.0106
Iteration 20, loss = 0.0147
Iteration 40, loss = 0.0159
Iteration 60, loss = 0.0198
Iteration 80, loss = 0.0114
--- Epoch 1092 / 100000
Iteration 0, loss = 0.0153
Iteration 20, loss = 0.0082
Iteration 40, loss = 0.0155
Iteration 60, loss = 0.0219
Iteration 80, loss = 0.0133
--- Epoch 1093 / 100000
Iteration 0, loss = 0.0080
Iteration 20, loss = 0.0102
Iteration 40, loss = 0.0179
Iteration 60, loss = 0.0114
Iteration 80, loss = 0.0168
--- Epoch 1094 / 100000
Iteration 0, loss = 0.0116
Iteration 20, loss = 0.0167
Iteration 40, loss = 0.0246
Iteration 60, loss = 0.0107
Iteration 80, loss = 0.0263
--- Epoch 1095 / 100000
Iteration 0, loss = 0.0116
Iteration 20, loss = 0.0201
Iteration 40, loss = 0.0128
Iteration 60, loss = 0.0092
Iteration 80, loss = 0.0116
--- Epoch 1096 / 100000
Iteration 0, loss = 0.0136
Iteration 20, loss = 0.0122
Iteration 40, loss = 0.0196
Iteration 60, loss = 0.0081
Iteration 80, loss = 0.0109
--- Epoch 1097 / 100000
Iteration 0, loss = 0.0149
Iteration 20, loss = 0.0358
Iteration 40, loss = 0.0126
Iteration 60, loss = 0.0254
Iteration 80, loss = 0.0072
--- Epoch 1098 / 100000
Iteration 0, loss = 0.0086
Iteration 20, loss = 0.0145
Iteration 40, loss = 0.0108
Iteration 60, loss = 0.0107
Iteration 80, loss = 0.0222
--- Epoch 1099 / 100000
Iteration 0, loss = 0.0183
Iteration 20, loss = 0.0122
Iteration 40, loss = 0.0119
Iteration 60, loss = 0.0142
Iteration 80, loss = 0.0136
--- Epoch 1100 / 100000
Iteration 0, loss = 0.0130
Iteration 20, loss = 0.0100
Iteration 40, loss = 0.0218
Iteration 60, loss = 0.0134
Iteration 80, loss = 0.0147
--- Epoch 1101 / 100000
Iteration 0, loss = 0.0100
Iteration 20, loss = 0.0064
Iteration 40, loss = 0.0095
Iteration 60, loss = 0.0133
Iteration 80, loss = 0.0095
--- Epoch 1102 / 100000
Iteration 0, loss = 0.0121
Iteration 20, loss = 0.0139
Iteration 40, loss = 0.0099
Iteration 60, loss = 0.0126
Iteration 80, loss = 0.0094
--- Epoch 1103 / 100000
Iteration 0, loss = 0.0174
Iteration 20, loss = 0.0161
Iteration 40, loss = 0.0147
Iteration 60, loss = 0.0122
Iteration 80, loss = 0.0116
--- Epoch 1104 / 100000
Iteration 0, loss = 0.0089
Iteration 20, loss = 0.0116
Iteration 40, loss = 0.0131
Iteration 60, loss = 0.0131
Iteration 80, loss = 0.0122
--- Epoch 1105 / 100000
Iteration 0, loss = 0.0080
Iteration 20, loss = 0.0096
Iteration 40, loss = 0.0074
Iteration 60, loss = 0.0097
Iteration 80, loss = 0.0138
--- Epoch 1106 / 100000
Iteration 0, loss = 0.0143
Iteration 20, loss = 0.0102
Iteration 40, loss = 0.0091
Iteration 60, loss = 0.0104
Iteration 80, loss = 0.0096
--- Epoch 1107 / 100000
Iteration 0, loss = 0.0143
Iteration 20, loss = 0.0100
Iteration 40, loss = 0.0167
Iteration 60, loss = 0.0139
Iteration 80, loss = 0.0108
--- Epoch 1108 / 100000
Iteration 0, loss = 0.0205
Iteration 20, loss = 0.0104
Iteration 40, loss = 0.0260
Iteration 60, loss = 0.0229
Iteration 80, loss = 0.0131
--- Epoch 1109 / 100000
Iteration 0, loss = 0.0117
Iteration 20, loss = 0.0093
Iteration 40, loss = 0.0103
Iteration 60, loss = 0.0073
Iteration 80, loss = 0.0136
--- Epoch 1110 / 100000
Iteration 0, loss = 0.0099
Iteration 20, loss = 0.0086
Iteration 40, loss = 0.0283
Iteration 60, loss = 0.0155
Iteration 80, loss = 0.0115
--- Epoch 1111 / 100000
Iteration 0, loss = 0.0083
Iteration 20, loss = 0.0144
Iteration 40, loss = 0.0135
Iteration 60, loss = 0.0147
Iteration 80, loss = 0.0128
--- Epoch 1112 / 100000
Iteration 0, loss = 0.0210
Iteration 20, loss = 0.0114
Iteration 40, loss = 0.0100
Iteration 60, loss = 0.0095
Iteration 80, loss = 0.0096
--- Epoch 1113 / 100000
Iteration 0, loss = 0.0093
Iteration 20, loss = 0.0210
Iteration 40, loss = 0.0228
Iteration 60, loss = 0.0214
Iteration 80, loss = 0.0114
--- Epoch 1114 / 100000
Iteration 0, loss = 0.0066
Iteration 20, loss = 0.0107
Iteration 40, loss = 0.0094
Iteration 60, loss = 0.0206
Iteration 80, loss = 0.0201
--- Epoch 1115 / 100000
Iteration 0, loss = 0.0251
Iteration 20, loss = 0.0088
Iteration 40, loss = 0.0231
Iteration 60, loss = 0.0194
Iteration 80, loss = 0.0142
--- Epoch 1116 / 100000
Iteration 0, loss = 0.0090
Iteration 20, loss = 0.0210
Iteration 40, loss = 0.0369
Iteration 60, loss = 0.0135
Iteration 80, loss = 0.0231
--- Epoch 1117 / 100000
Iteration 0, loss = 0.0111
Iteration 20, loss = 0.0078
Iteration 40, loss = 0.0118
Iteration 60, loss = 0.0092
Iteration 80, loss = 0.0087
--- Epoch 1118 / 100000
Iteration 0, loss = 0.0450
Iteration 20, loss = 0.0223
Iteration 40, loss = 0.0127
Iteration 60, loss = 0.0143
Iteration 80, loss = 0.0152
--- Epoch 1119 / 100000
Iteration 0, loss = 0.0132
Iteration 20, loss = 0.0127
Iteration 40, loss = 0.0167
Iteration 60, loss = 0.0151
Iteration 80, loss = 0.0093
--- Epoch 1120 / 100000
Iteration 0, loss = 0.0127
Iteration 20, loss = 0.0130
Iteration 40, loss = 0.0087
Iteration 60, loss = 0.0173
Iteration 80, loss = 0.0099
--- Epoch 1121 / 100000
Iteration 0, loss = 0.0073
Iteration 20, loss = 0.0136
Iteration 40, loss = 0.0097
Iteration 60, loss = 0.0088
Iteration 80, loss = 0.0100
--- Epoch 1122 / 100000
Iteration 0, loss = 0.0102
Iteration 20, loss = 0.0231
Iteration 40, loss = 0.0095
Iteration 60, loss = 0.0113
Iteration 80, loss = 0.0148
--- Epoch 1123 / 100000
Iteration 0, loss = 0.0148
Iteration 20, loss = 0.0086
Iteration 40, loss = 0.0097
Iteration 60, loss = 0.0115
Iteration 80, loss = 0.0082
--- Epoch 1124 / 100000
Iteration 0, loss = 0.0179
Iteration 20, loss = 0.0603
Iteration 40, loss = 0.0078
Iteration 60, loss = 0.0129
Iteration 80, loss = 0.0412
--- Epoch 1125 / 100000
Iteration 0, loss = 0.0225
Iteration 20, loss = 0.0148
Iteration 40, loss = 0.0145
Iteration 60, loss = 0.0223
Iteration 80, loss = 0.0112
--- Epoch 1126 / 100000
Iteration 0, loss = 0.0105
Iteration 20, loss = 0.0114
Iteration 40, loss = 0.0111
Iteration 60, loss = 0.0165
Iteration 80, loss = 0.0098
--- Epoch 1127 / 100000
Iteration 0, loss = 0.0077
Iteration 20, loss = 0.0161
Iteration 40, loss = 0.0109
Iteration 60, loss = 0.0096
Iteration 80, loss = 0.0243
--- Epoch 1128 / 100000
Iteration 0, loss = 0.0263
Iteration 20, loss = 0.0144
Iteration 40, loss = 0.0085
Iteration 60, loss = 0.0086
Iteration 80, loss = 0.0156
--- Epoch 1129 / 100000
Iteration 0, loss = 0.0088
Iteration 20, loss = 0.0173
Iteration 40, loss = 0.0117
Iteration 60, loss = 0.0120
Iteration 80, loss = 0.0224
---------------------------------------------------------------------------
KeyboardInterrupt                         Traceback (most recent call last)
<ipython-input-561-b24253d770e1> in <module>
----> 1 train(model8, optimizer, epochs=100000, x_train=data["X_train_class"],  y_train=data["y_train_class"], criterion=nn.MSELoss())

<ipython-input-502-f8fe1643891d> in train(model, optimizer, epochs, x_train, y_train, criterion)
     27             y = y_batch[t].to(device=device, dtype=dtype)
     28 
---> 29             scores = model(x)
     30 
     31             loss = criterion(scores.view(-1), y.view(-1))

/opt/anaconda3/envs/cs682/lib/python3.6/site-packages/torch/nn/modules/module.py in _call_impl(self, *input, **kwargs)
    720             result = self._slow_forward(*input, **kwargs)
    721         else:
--> 722             result = self.forward(*input, **kwargs)
    723         for hook in itertools.chain(
    724                 _global_forward_hooks.values(),

<ipython-input-559-1454e4041bce> in forward(self, x)
     35         scores = F.relu(self.batchnorm6(self.conv6(scores)))
     36         scores = self.upsample(scores)
---> 37         scores = torch.tanh(self.conv7(scores))
     38 
     39 #         with_x = torch.cat((scores.view(-1), x.view(-1)), 0)

/opt/anaconda3/envs/cs682/lib/python3.6/site-packages/torch/nn/modules/module.py in _call_impl(self, *input, **kwargs)
    720             result = self._slow_forward(*input, **kwargs)
    721         else:
--> 722             result = self.forward(*input, **kwargs)
    723         for hook in itertools.chain(
    724                 _global_forward_hooks.values(),

/opt/anaconda3/envs/cs682/lib/python3.6/site-packages/torch/nn/modules/conv.py in forward(self, input)
    417 
    418     def forward(self, input: Tensor) -> Tensor:
--> 419         return self._conv_forward(input, self.weight)
    420 
    421 class Conv3d(_ConvNd):

/opt/anaconda3/envs/cs682/lib/python3.6/site-packages/torch/nn/modules/conv.py in _conv_forward(self, input, weight)
    414                             _pair(0), self.dilation, self.groups)
    415         return F.conv2d(input, weight, self.bias, self.stride,
--> 416                         self.padding, self.dilation, self.groups)
    417 
    418     def forward(self, input: Tensor) -> Tensor:

KeyboardInterrupt: 
In [562]:
# Evaluate model8 on the "class" test split, passing L1 loss as the criterion.
# The preceding training cell was stopped by hand (KeyboardInterrupt), so this
# runs against whatever weights model8 had at that moment.
# NOTE(review): testModel, model8 and the data["*_class"] entries are defined
# in earlier cells; the imshow clipping warnings below suggest testModel also
# plots predictions whose values fall outside [0, 1] -- confirm.
testModel(model8, x_test=data["X_test_class"], y_test=data["y_test_class"], criterion=nn.L1Loss())
Clipping input data to the valid range for imshow with RGB data ([0..1] for floats or [0..255] for integers).
Clipping input data to the valid range for imshow with RGB data ([0..1] for floats or [0..255] for integers).
Clipping input data to the valid range for imshow with RGB data ([0..1] for floats or [0..255] for integers).
Clipping input data to the valid range for imshow with RGB data ([0..1] for floats or [0..255] for integers).
In [24]:
class ConvNet4(nn.Module):
    """Convolutional encoder-decoder that colorizes one grayscale image.

    The encoder (conv1-conv4) shrinks the spatial size by a factor of 8 using
    three stride-2 convolutions; the decoder (conv5-conv7) restores it with
    three 2x bilinear upsampling steps. The 3-channel tanh output is added to
    the single-channel input (broadcast over channels), so the convolutions
    only have to predict a per-channel offset from the gray image.

    Attributes:
        epochsTrained: counter initialised to 0. This class never changes it;
            presumably the training loop maintains it -- TODO confirm.
    """

    def __init__(self):
        super().__init__()
        self.epochsTrained = 0

        self.batchnorm1 = nn.BatchNorm2d(32)
        self.batchnorm2 = nn.BatchNorm2d(64)
        self.batchnorm3 = nn.BatchNorm2d(128)
        self.batchnorm4 = nn.BatchNorm2d(128)
        self.batchnorm5 = nn.BatchNorm2d(64)
        self.batchnorm6 = nn.BatchNorm2d(32)

        # align_corners=False is what PyTorch already uses when the argument
        # is omitted; spelling it out keeps the numerics identical and avoids
        # the "default upsampling behavior" UserWarning on every forward pass.
        self.upsample = nn.Upsample(scale_factor=2, mode='bilinear', align_corners=False)

        self.conv1 = nn.Conv2d(1, 32, kernel_size=3, padding=1)
        self.conv2 = nn.Conv2d(32, 64, kernel_size=3, stride=2, padding=1)
        self.conv3 = nn.Conv2d(64, 128, kernel_size=3, stride=2, padding=1)
        self.conv4 = nn.Conv2d(128, 128, kernel_size=3, stride=2, padding=1)
        self.conv5 = nn.Conv2d(128, 64, kernel_size=3, padding=1)
        self.conv6 = nn.Conv2d(64, 32, kernel_size=3, padding=1)
        self.conv7 = nn.Conv2d(32, 3, kernel_size=3, padding=1)

    def forward(self, x):
        """Colorize a single image.

        Args:
            x: one 3-D image tensor indexed as ``x[0, :, :]``; only the first
                channel is used as the grayscale input. Height and width must
                be multiples of 8 (e.g. 32) so that the upsampled decoder
                output matches the input size for the residual addition.

        Returns:
            A flattened 1-D tensor holding the 3-channel prediction, min-max
            scaled to [0, 1]. If the prediction is constant (max == min) the
            result is all zeros instead of NaN.
        """
        # Keep only channel 0 and add batch + channel axes -> (1, 1, H, W).
        x = x[0, :, :].unsqueeze(0).unsqueeze(0)

        # Encoder
        scores = F.relu(self.batchnorm1(self.conv1(x)))
        scores = F.relu(self.batchnorm2(self.conv2(scores)))
        scores = F.relu(self.batchnorm3(self.conv3(scores)))
        scores = F.relu(self.batchnorm4(self.conv4(scores)))

        # Decoder
        scores = self.upsample(scores)
        scores = F.relu(self.batchnorm5(self.conv5(scores)))
        scores = self.upsample(scores)
        scores = F.relu(self.batchnorm6(self.conv6(scores)))
        scores = self.upsample(scores)

        # Add x to the scores so the network learns how to color x rather
        # than having to reproduce the structure of x.
        scores = torch.tanh(self.conv7(scores)) + x

        # Min-max normalise to [0, 1]. The range is clamped away from zero so
        # a constant prediction yields zeros rather than 0/0 = NaN.
        scores = scores.view(-1)
        lowest = torch.min(scores)
        value_range = torch.clamp(torch.max(scores) - lowest,
                                  min=torch.finfo(scores.dtype).eps)
        scores = (scores - lowest) / value_range

        return scores
In [116]:
# Build a fresh ConvNet4 and a plain SGD optimizer (no momentum or weight decay
# arguments are passed) over its parameters, with a step size of 1e-2.
# NOTE(review): `optimizer` and `learning_rate` are generic names that other
# model cells may also assign; re-run this cell before training model9 so the
# optimizer is bound to model9's parameters.
learning_rate = 1e-2
model9 = ConvNet4()
optimizer = optim.SGD(model9.parameters(), lr=learning_rate)
In [117]:
# Train model9 with the optimizer from the previous cell for 2000 epochs,
# using mean-squared error as the criterion.
# NOTE(review): `train` and the data["*_ship"] entries are defined in earlier
# cells; the "_ship" keys are presumably a single-class (ship) subset of the
# data -- confirm.
train(model9, optimizer, epochs=2000, x_train=data["X_train_ship"],  y_train=data["y_train_ship"], criterion=nn.MSELoss())
--- Epoch 1 / 2000 - 1 epochs total
Iteration 0, loss = 0.0564
Iteration 20, loss = 0.0359
Iteration 40, loss = 0.0359
Iteration 60, loss = 0.0223
Iteration 80, loss = 0.0284
--- Epoch 2 / 2000 - 2 epochs total
Iteration 0, loss = 0.0162
Iteration 20, loss = 0.0177
Iteration 40, loss = 0.0427
Iteration 60, loss = 0.0245
Iteration 80, loss = 0.0186
--- Epoch 3 / 2000 - 3 epochs total
Iteration 0, loss = 0.0228
Iteration 20, loss = 0.0115
Iteration 40, loss = 0.0079
Iteration 60, loss = 0.0230
Iteration 80, loss = 0.0183
--- Epoch 4 / 2000 - 4 epochs total
Iteration 0, loss = 0.0417
Iteration 20, loss = 0.0443
Iteration 40, loss = 0.0128
Iteration 60, loss = 0.0161
Iteration 80, loss = 0.0675
--- Epoch 5 / 2000 - 5 epochs total
Iteration 0, loss = 0.0193
Iteration 20, loss = 0.0121
Iteration 40, loss = 0.0114
Iteration 60, loss = 0.0103
Iteration 80, loss = 0.0118
--- Epoch 6 / 2000 - 6 epochs total
Iteration 0, loss = 0.0122
Iteration 20, loss = 0.0150
Iteration 40, loss = 0.0095
Iteration 60, loss = 0.0150
Iteration 80, loss = 0.0076
--- Epoch 7 / 2000 - 7 epochs total
Iteration 0, loss = 0.0111
Iteration 20, loss = 0.0180
Iteration 40, loss = 0.0116
Iteration 60, loss = 0.0112
Iteration 80, loss = 0.0143
--- Epoch 8 / 2000 - 8 epochs total
Iteration 0, loss = 0.0219
Iteration 20, loss = 0.0189
Iteration 40, loss = 0.0318
Iteration 60, loss = 0.0157
Iteration 80, loss = 0.0137
--- Epoch 9 / 2000 - 9 epochs total
Iteration 0, loss = 0.0129
Iteration 20, loss = 0.0067
Iteration 40, loss = 0.0099
Iteration 60, loss = 0.0079
Iteration 80, loss = 0.0164
--- Epoch 10 / 2000 - 10 epochs total
Iteration 0, loss = 0.0106
Iteration 20, loss = 0.0291
Iteration 40, loss = 0.0132
Iteration 60, loss = 0.0118
Iteration 80, loss = 0.0121
--- Epoch 11 / 2000 - 11 epochs total
Iteration 0, loss = 0.0314
Iteration 20, loss = 0.0170
Iteration 40, loss = 0.0447
Iteration 60, loss = 0.0097
Iteration 80, loss = 0.0070
--- Epoch 12 / 2000 - 12 epochs total
Iteration 0, loss = 0.0087
Iteration 20, loss = 0.0288
Iteration 40, loss = 0.0146
Iteration 60, loss = 0.0141
Iteration 80, loss = 0.0117
--- Epoch 13 / 2000 - 13 epochs total
Iteration 0, loss = 0.0058
Iteration 20, loss = 0.0363
Iteration 40, loss = 0.0087
Iteration 60, loss = 0.0106
Iteration 80, loss = 0.0129
--- Epoch 14 / 2000 - 14 epochs total
Iteration 0, loss = 0.0284
Iteration 20, loss = 0.0206
Iteration 40, loss = 0.0195
Iteration 60, loss = 0.0077
Iteration 80, loss = 0.0171
--- Epoch 15 / 2000 - 15 epochs total
Iteration 0, loss = 0.0133
Iteration 20, loss = 0.0050
Iteration 40, loss = 0.0159
Iteration 60, loss = 0.0059
Iteration 80, loss = 0.0078
--- Epoch 16 / 2000 - 16 epochs total
Iteration 0, loss = 0.0404
Iteration 20, loss = 0.0130
Iteration 40, loss = 0.0205
Iteration 60, loss = 0.0150
Iteration 80, loss = 0.0126
--- Epoch 17 / 2000 - 17 epochs total
Iteration 0, loss = 0.0118
Iteration 20, loss = 0.0054
Iteration 40, loss = 0.0241
Iteration 60, loss = 0.0129
Iteration 80, loss = 0.0048
--- Epoch 18 / 2000 - 18 epochs total
Iteration 0, loss = 0.0116
Iteration 20, loss = 0.0125
Iteration 40, loss = 0.0090
Iteration 60, loss = 0.0474
Iteration 80, loss = 0.0116
--- Epoch 19 / 2000 - 19 epochs total
Iteration 0, loss = 0.0165
Iteration 20, loss = 0.0065
Iteration 40, loss = 0.0096
Iteration 60, loss = 0.0123
Iteration 80, loss = 0.0031
--- Epoch 20 / 2000 - 20 epochs total
Iteration 0, loss = 0.0086
Iteration 20, loss = 0.0129
Iteration 40, loss = 0.0344
Iteration 60, loss = 0.0035
Iteration 80, loss = 0.0090
--- Epoch 21 / 2000 - 21 epochs total
Iteration 0, loss = 0.0123
Iteration 20, loss = 0.0127
Iteration 40, loss = 0.0074
Iteration 60, loss = 0.0129
Iteration 80, loss = 0.0162
--- Epoch 22 / 2000 - 22 epochs total
Iteration 0, loss = 0.0072
Iteration 20, loss = 0.0232
Iteration 40, loss = 0.0385
Iteration 60, loss = 0.0295
Iteration 80, loss = 0.0122
--- Epoch 23 / 2000 - 23 epochs total
Iteration 0, loss = 0.0081
Iteration 20, loss = 0.0069
Iteration 40, loss = 0.0057
Iteration 60, loss = 0.0036
Iteration 80, loss = 0.0088
--- Epoch 24 / 2000 - 24 epochs total
Iteration 0, loss = 0.0064
Iteration 20, loss = 0.0149
Iteration 40, loss = 0.0038
Iteration 60, loss = 0.0045
Iteration 80, loss = 0.0067
--- Epoch 25 / 2000 - 25 epochs total
Iteration 0, loss = 0.0067
Iteration 20, loss = 0.0066
Iteration 40, loss = 0.0274
Iteration 60, loss = 0.0083
Iteration 80, loss = 0.0073
--- Epoch 26 / 2000 - 26 epochs total
Iteration 0, loss = 0.0063
Iteration 20, loss = 0.0052
Iteration 40, loss = 0.0228
Iteration 60, loss = 0.0106
Iteration 80, loss = 0.0054
--- Epoch 27 / 2000 - 27 epochs total
Iteration 0, loss = 0.0088
Iteration 20, loss = 0.0098
Iteration 40, loss = 0.0269
Iteration 60, loss = 0.0076
Iteration 80, loss = 0.0092
--- Epoch 28 / 2000 - 28 epochs total
Iteration 0, loss = 0.0265
Iteration 20, loss = 0.0069
Iteration 40, loss = 0.0195
Iteration 60, loss = 0.0105
Iteration 80, loss = 0.0057
--- Epoch 29 / 2000 - 29 epochs total
Iteration 0, loss = 0.0034
Iteration 20, loss = 0.0097
Iteration 40, loss = 0.0076
Iteration 60, loss = 0.0048
Iteration 80, loss = 0.0031
--- Epoch 30 / 2000 - 30 epochs total
Iteration 0, loss = 0.0582
Iteration 20, loss = 0.0083
Iteration 40, loss = 0.0077
Iteration 60, loss = 0.0062
Iteration 80, loss = 0.0110
--- Epoch 31 / 2000 - 31 epochs total
Iteration 0, loss = 0.0164
Iteration 20, loss = 0.0115
Iteration 40, loss = 0.0073
Iteration 60, loss = 0.0098
Iteration 80, loss = 0.0085
--- Epoch 32 / 2000 - 32 epochs total
Iteration 0, loss = 0.0204
Iteration 20, loss = 0.0090
Iteration 40, loss = 0.0070
Iteration 60, loss = 0.0302
Iteration 80, loss = 0.0062
--- Epoch 33 / 2000 - 33 epochs total
Iteration 0, loss = 0.0074
Iteration 20, loss = 0.0139
Iteration 40, loss = 0.0064
Iteration 60, loss = 0.0237
Iteration 80, loss = 0.0166
--- Epoch 34 / 2000 - 34 epochs total
Iteration 0, loss = 0.0193
Iteration 20, loss = 0.0124
Iteration 40, loss = 0.0036
Iteration 60, loss = 0.0106
Iteration 80, loss = 0.0445
--- Epoch 35 / 2000 - 35 epochs total
Iteration 0, loss = 0.0220
Iteration 20, loss = 0.0163
Iteration 40, loss = 0.0137
Iteration 60, loss = 0.0138
Iteration 80, loss = 0.0321
--- Epoch 36 / 2000 - 36 epochs total
Iteration 0, loss = 0.0117
Iteration 20, loss = 0.0094
Iteration 40, loss = 0.0073
Iteration 60, loss = 0.0184
Iteration 80, loss = 0.0370
--- Epoch 37 / 2000 - 37 epochs total
Iteration 0, loss = 0.0053
Iteration 20, loss = 0.0052
Iteration 40, loss = 0.0099
Iteration 60, loss = 0.0133
Iteration 80, loss = 0.0047
--- Epoch 38 / 2000 - 38 epochs total
Iteration 0, loss = 0.0058
Iteration 20, loss = 0.0102
Iteration 40, loss = 0.0116
Iteration 60, loss = 0.0053
Iteration 80, loss = 0.0053
--- Epoch 39 / 2000 - 39 epochs total
Iteration 0, loss = 0.0034
Iteration 20, loss = 0.0248
Iteration 40, loss = 0.0033
Iteration 60, loss = 0.0056
Iteration 80, loss = 0.0072
--- Epoch 40 / 2000 - 40 epochs total
Iteration 0, loss = 0.0161
Iteration 20, loss = 0.0115
Iteration 40, loss = 0.0129
Iteration 60, loss = 0.0040
Iteration 80, loss = 0.0062
--- Epoch 41 / 2000 - 41 epochs total
Iteration 0, loss = 0.0063
Iteration 20, loss = 0.0096
Iteration 40, loss = 0.0048
Iteration 60, loss = 0.0114
Iteration 80, loss = 0.0171
--- Epoch 42 / 2000 - 42 epochs total
Iteration 0, loss = 0.0165
Iteration 20, loss = 0.0161
Iteration 40, loss = 0.0065
Iteration 60, loss = 0.0244
Iteration 80, loss = 0.0444
--- Epoch 43 / 2000 - 43 epochs total
Iteration 0, loss = 0.0072
Iteration 20, loss = 0.0116
Iteration 40, loss = 0.0130
Iteration 60, loss = 0.0077
Iteration 80, loss = 0.0102
--- Epoch 44 / 2000 - 44 epochs total
Iteration 0, loss = 0.0144
Iteration 20, loss = 0.0053
Iteration 40, loss = 0.0071
Iteration 60, loss = 0.0093
Iteration 80, loss = 0.0303
--- Epoch 45 / 2000 - 45 epochs total
Iteration 0, loss = 0.0149
Iteration 20, loss = 0.0132
Iteration 40, loss = 0.0044
Iteration 60, loss = 0.0057
Iteration 80, loss = 0.0096
--- Epoch 46 / 2000 - 46 epochs total
Iteration 0, loss = 0.0038
Iteration 20, loss = 0.0052
Iteration 40, loss = 0.0131
Iteration 60, loss = 0.0030
Iteration 80, loss = 0.0088
--- Epoch 47 / 2000 - 47 epochs total
Iteration 0, loss = 0.0026
Iteration 20, loss = 0.0029
Iteration 40, loss = 0.0069
Iteration 60, loss = 0.0053
Iteration 80, loss = 0.0057
--- Epoch 48 / 2000 - 48 epochs total
Iteration 0, loss = 0.0211
Iteration 20, loss = 0.0081
Iteration 40, loss = 0.0137
Iteration 60, loss = 0.0073
Iteration 80, loss = 0.0190
--- Epoch 49 / 2000 - 49 epochs total
Iteration 0, loss = 0.0319
Iteration 20, loss = 0.0036
Iteration 40, loss = 0.0042
Iteration 60, loss = 0.0077
Iteration 80, loss = 0.0083
--- Epoch 50 / 2000 - 50 epochs total
Iteration 0, loss = 0.0193
Iteration 20, loss = 0.0070
Iteration 40, loss = 0.0141
Iteration 60, loss = 0.0069
Iteration 80, loss = 0.0136
--- Epoch 51 / 2000 - 51 epochs total
Iteration 0, loss = 0.0092
Iteration 20, loss = 0.0135
Iteration 40, loss = 0.0039
Iteration 60, loss = 0.0053
Iteration 80, loss = 0.0073
--- Epoch 52 / 2000 - 52 epochs total
Iteration 0, loss = 0.0134
Iteration 20, loss = 0.0284
Iteration 40, loss = 0.0093
Iteration 60, loss = 0.0035
Iteration 80, loss = 0.0096
--- Epoch 53 / 2000 - 53 epochs total
Iteration 0, loss = 0.0148
Iteration 20, loss = 0.0175
Iteration 40, loss = 0.0256
Iteration 60, loss = 0.0091
Iteration 80, loss = 0.0058
--- Epoch 54 / 2000 - 54 epochs total
Iteration 0, loss = 0.0052
Iteration 20, loss = 0.0083
Iteration 40, loss = 0.0052
Iteration 60, loss = 0.0241
Iteration 80, loss = 0.0128
--- Epoch 55 / 2000 - 55 epochs total
Iteration 0, loss = 0.0054
Iteration 20, loss = 0.0036
Iteration 40, loss = 0.0190
Iteration 60, loss = 0.0210
Iteration 80, loss = 0.0077
--- Epoch 56 / 2000 - 56 epochs total
Iteration 0, loss = 0.0058
Iteration 20, loss = 0.0077
Iteration 40, loss = 0.0176
Iteration 60, loss = 0.0132
Iteration 80, loss = 0.0115
--- Epoch 57 / 2000 - 57 epochs total
Iteration 0, loss = 0.0045
Iteration 20, loss = 0.0269
Iteration 40, loss = 0.0227
Iteration 60, loss = 0.0124
Iteration 80, loss = 0.0153
--- Epoch 58 / 2000 - 58 epochs total
Iteration 0, loss = 0.0110
Iteration 20, loss = 0.0082
Iteration 40, loss = 0.0265
Iteration 60, loss = 0.0177
Iteration 80, loss = 0.0043
--- Epoch 59 / 2000 - 59 epochs total
Iteration 0, loss = 0.0048
Iteration 20, loss = 0.0044
Iteration 40, loss = 0.0258
Iteration 60, loss = 0.0238
Iteration 80, loss = 0.0057
--- Epoch 60 / 2000 - 60 epochs total
Iteration 0, loss = 0.0122
Iteration 20, loss = 0.0169
Iteration 40, loss = 0.0086
Iteration 60, loss = 0.0181
Iteration 80, loss = 0.0071
--- Epoch 61 / 2000 - 61 epochs total
Iteration 0, loss = 0.0338
Iteration 20, loss = 0.0089
Iteration 40, loss = 0.0107
Iteration 60, loss = 0.0150
Iteration 80, loss = 0.0029
--- Epoch 62 / 2000 - 62 epochs total
Iteration 0, loss = 0.0040
Iteration 20, loss = 0.0029
Iteration 40, loss = 0.0201
Iteration 60, loss = 0.0058
Iteration 80, loss = 0.0049
--- Epoch 63 / 2000 - 63 epochs total
Iteration 0, loss = 0.0042
Iteration 20, loss = 0.0042
Iteration 40, loss = 0.0037
Iteration 60, loss = 0.0059
Iteration 80, loss = 0.0057
--- Epoch 64 / 2000 - 64 epochs total
Iteration 0, loss = 0.0446
Iteration 20, loss = 0.0052
Iteration 40, loss = 0.0032
Iteration 60, loss = 0.0037
Iteration 80, loss = 0.0071
--- Epoch 65 / 2000 - 65 epochs total
Iteration 0, loss = 0.0025
Iteration 20, loss = 0.0066
Iteration 40, loss = 0.0075
Iteration 60, loss = 0.0151
Iteration 80, loss = 0.0065
--- Epoch 66 / 2000 - 66 epochs total
Iteration 0, loss = 0.0235
Iteration 20, loss = 0.0026
Iteration 40, loss = 0.0209
Iteration 60, loss = 0.0070
Iteration 80, loss = 0.0046
--- Epoch 67 / 2000 - 67 epochs total
Iteration 0, loss = 0.0043
Iteration 20, loss = 0.0250
Iteration 40, loss = 0.0080
Iteration 60, loss = 0.0177
Iteration 80, loss = 0.0058
--- Epoch 68 / 2000 - 68 epochs total
Iteration 0, loss = 0.0067
Iteration 20, loss = 0.0145
Iteration 40, loss = 0.0026
Iteration 60, loss = 0.0095
Iteration 80, loss = 0.0139
--- Epoch 69 / 2000 - 69 epochs total
Iteration 0, loss = 0.0058
Iteration 20, loss = 0.0207
Iteration 40, loss = 0.0200
Iteration 60, loss = 0.0039
Iteration 80, loss = 0.0352
--- Epoch 70 / 2000 - 70 epochs total
Iteration 0, loss = 0.0146
Iteration 20, loss = 0.0058
Iteration 40, loss = 0.0071
Iteration 60, loss = 0.0047
Iteration 80, loss = 0.0052
--- Epoch 71 / 2000 - 71 epochs total
Iteration 0, loss = 0.0065
Iteration 20, loss = 0.0047
Iteration 40, loss = 0.0031
Iteration 60, loss = 0.0033
Iteration 80, loss = 0.0101
--- Epoch 72 / 2000 - 72 epochs total
Iteration 0, loss = 0.0038
Iteration 20, loss = 0.0033
Iteration 40, loss = 0.0168
Iteration 60, loss = 0.0047
Iteration 80, loss = 0.0076
--- Epoch 73 / 2000 - 73 epochs total
Iteration 0, loss = 0.0031
Iteration 20, loss = 0.0122
Iteration 40, loss = 0.0105
Iteration 60, loss = 0.0201
Iteration 80, loss = 0.0107
--- Epoch 74 / 2000 - 74 epochs total
Iteration 0, loss = 0.0035
Iteration 20, loss = 0.0171
Iteration 40, loss = 0.0050
Iteration 60, loss = 0.0120
Iteration 80, loss = 0.0086
--- Epoch 75 / 2000 - 75 epochs total
Iteration 0, loss = 0.0050
Iteration 20, loss = 0.0044
Iteration 40, loss = 0.0051
Iteration 60, loss = 0.0099
Iteration 80, loss = 0.0053
--- Epoch 76 / 2000 - 76 epochs total
Iteration 0, loss = 0.0319
Iteration 20, loss = 0.0192
Iteration 40, loss = 0.0074
Iteration 60, loss = 0.0096
Iteration 80, loss = 0.0030
--- Epoch 77 / 2000 - 77 epochs total
Iteration 0, loss = 0.0053
Iteration 20, loss = 0.0133
Iteration 40, loss = 0.0066
Iteration 60, loss = 0.0058
Iteration 80, loss = 0.0063
--- Epoch 78 / 2000 - 78 epochs total
Iteration 0, loss = 0.0054
Iteration 20, loss = 0.0134
Iteration 40, loss = 0.0103
Iteration 60, loss = 0.0082
Iteration 80, loss = 0.0041
--- Epoch 79 / 2000 - 79 epochs total
Iteration 0, loss = 0.0068
Iteration 20, loss = 0.0205
Iteration 40, loss = 0.0178
Iteration 60, loss = 0.0022
Iteration 80, loss = 0.0030
--- Epoch 80 / 2000 - 80 epochs total
Iteration 0, loss = 0.0026
Iteration 20, loss = 0.0156
Iteration 40, loss = 0.0107
Iteration 60, loss = 0.0170
Iteration 80, loss = 0.0073
--- Epoch 81 / 2000 - 81 epochs total
Iteration 0, loss = 0.0282
Iteration 20, loss = 0.0254
Iteration 40, loss = 0.0067
Iteration 60, loss = 0.0050
Iteration 80, loss = 0.0238
--- Epoch 82 / 2000 - 82 epochs total
Iteration 0, loss = 0.0129
Iteration 20, loss = 0.0051
Iteration 40, loss = 0.0100
Iteration 60, loss = 0.0053
Iteration 80, loss = 0.0094
--- Epoch 83 / 2000 - 83 epochs total
Iteration 0, loss = 0.0092
Iteration 20, loss = 0.0089
Iteration 40, loss = 0.0501
Iteration 60, loss = 0.0137
Iteration 80, loss = 0.0133
--- Epoch 84 / 2000 - 84 epochs total
Iteration 0, loss = 0.0140
Iteration 20, loss = 0.0206
Iteration 40, loss = 0.0087
Iteration 60, loss = 0.0033
Iteration 80, loss = 0.0200
--- Epoch 85 / 2000 - 85 epochs total
Iteration 0, loss = 0.0100
Iteration 20, loss = 0.0052
Iteration 40, loss = 0.0101
Iteration 60, loss = 0.0155
Iteration 80, loss = 0.0037
--- Epoch 86 / 2000 - 86 epochs total
Iteration 0, loss = 0.0033
Iteration 20, loss = 0.0185
Iteration 40, loss = 0.0082
Iteration 60, loss = 0.0066
Iteration 80, loss = 0.0184
--- Epoch 87 / 2000 - 87 epochs total
Iteration 0, loss = 0.0083
Iteration 20, loss = 0.0064
Iteration 40, loss = 0.0086
Iteration 60, loss = 0.0031
Iteration 80, loss = 0.0150
--- Epoch 88 / 2000 - 88 epochs total
Iteration 0, loss = 0.0042
Iteration 20, loss = 0.0059
Iteration 40, loss = 0.0077
Iteration 60, loss = 0.0095
Iteration 80, loss = 0.0156
--- Epoch 89 / 2000 - 89 epochs total
Iteration 0, loss = 0.0032
Iteration 20, loss = 0.0058
Iteration 40, loss = 0.0087
Iteration 60, loss = 0.0034
Iteration 80, loss = 0.0054
--- Epoch 90 / 2000 - 90 epochs total
Iteration 0, loss = 0.0064
Iteration 20, loss = 0.0076
Iteration 40, loss = 0.0045
Iteration 60, loss = 0.0089
Iteration 80, loss = 0.0218
--- Epoch 91 / 2000 - 91 epochs total
Iteration 0, loss = 0.0078
Iteration 20, loss = 0.0045
Iteration 40, loss = 0.0036
Iteration 60, loss = 0.0094
Iteration 80, loss = 0.0266
--- Epoch 92 / 2000 - 92 epochs total
Iteration 0, loss = 0.0130
Iteration 20, loss = 0.0023
Iteration 40, loss = 0.0025
Iteration 60, loss = 0.0142
Iteration 80, loss = 0.0377
--- Epoch 93 / 2000 - 93 epochs total
Iteration 0, loss = 0.0205
Iteration 20, loss = 0.0030
Iteration 40, loss = 0.0069
Iteration 60, loss = 0.0066
Iteration 80, loss = 0.0036
--- Epoch 94 / 2000 - 94 epochs total
Iteration 0, loss = 0.0071
Iteration 20, loss = 0.0118
Iteration 40, loss = 0.0365
Iteration 60, loss = 0.0136
Iteration 80, loss = 0.0058
--- Epoch 95 / 2000 - 95 epochs total
Iteration 0, loss = 0.0229
Iteration 20, loss = 0.0042
Iteration 40, loss = 0.0121
Iteration 60, loss = 0.0134
Iteration 80, loss = 0.0080
--- Epoch 96 / 2000 - 96 epochs total
Iteration 0, loss = 0.0051
Iteration 20, loss = 0.0042
Iteration 40, loss = 0.0039
Iteration 60, loss = 0.0088
Iteration 80, loss = 0.0078
--- Epoch 97 / 2000 - 97 epochs total
Iteration 0, loss = 0.0064
Iteration 20, loss = 0.0129
Iteration 40, loss = 0.0053
Iteration 60, loss = 0.0034
Iteration 80, loss = 0.0093
--- Epoch 98 / 2000 - 98 epochs total
Iteration 0, loss = 0.0051
Iteration 20, loss = 0.0114
Iteration 40, loss = 0.0052
Iteration 60, loss = 0.0040
Iteration 80, loss = 0.0215
--- Epoch 99 / 2000 - 99 epochs total
Iteration 0, loss = 0.0035
Iteration 20, loss = 0.0040
Iteration 40, loss = 0.0218
Iteration 60, loss = 0.0090
Iteration 80, loss = 0.0083
--- Epoch 100 / 2000 - 100 epochs total
Iteration 0, loss = 0.0156
Iteration 20, loss = 0.0049
Iteration 40, loss = 0.0058
Iteration 60, loss = 0.0174
Iteration 80, loss = 0.0322
--- Epoch 101 / 2000 - 101 epochs total
Iteration 0, loss = 0.0140
Iteration 20, loss = 0.0060
Iteration 40, loss = 0.0409
Iteration 60, loss = 0.0026
Iteration 80, loss = 0.0057
--- Epoch 102 / 2000 - 102 epochs total
Iteration 0, loss = 0.0039
Iteration 20, loss = 0.0142
Iteration 40, loss = 0.0036
Iteration 60, loss = 0.0041
Iteration 80, loss = 0.0033
--- Epoch 103 / 2000 - 103 epochs total
Iteration 0, loss = 0.0060
Iteration 20, loss = 0.0106
Iteration 40, loss = 0.0103
Iteration 60, loss = 0.0057
Iteration 80, loss = 0.0067
--- Epoch 104 / 2000 - 104 epochs total
Iteration 0, loss = 0.0013
Iteration 20, loss = 0.0074
Iteration 40, loss = 0.0191
Iteration 60, loss = 0.0042
Iteration 80, loss = 0.0058
--- Epoch 105 / 2000 - 105 epochs total
Iteration 0, loss = 0.0068
Iteration 20, loss = 0.0028
Iteration 40, loss = 0.0073
Iteration 60, loss = 0.0111
Iteration 80, loss = 0.0038
--- Epoch 106 / 2000 - 106 epochs total
Iteration 0, loss = 0.0038
Iteration 20, loss = 0.0028
Iteration 40, loss = 0.0051
Iteration 60, loss = 0.0034
Iteration 80, loss = 0.0363
--- Epoch 107 / 2000 - 107 epochs total
Iteration 0, loss = 0.0132
Iteration 20, loss = 0.0048
Iteration 40, loss = 0.0034
Iteration 60, loss = 0.0040
Iteration 80, loss = 0.0112
--- Epoch 108 / 2000 - 108 epochs total
Iteration 0, loss = 0.0042
Iteration 20, loss = 0.0319
Iteration 40, loss = 0.0040
Iteration 60, loss = 0.0112
Iteration 80, loss = 0.0053
--- Epoch 109 / 2000 - 109 epochs total
Iteration 0, loss = 0.0117
Iteration 20, loss = 0.0127
Iteration 40, loss = 0.0073
Iteration 60, loss = 0.1290
Iteration 80, loss = 0.0030
--- Epoch 110 / 2000 - 110 epochs total
Iteration 0, loss = 0.0070
Iteration 20, loss = 0.0029
Iteration 40, loss = 0.0100
Iteration 60, loss = 0.0025
Iteration 80, loss = 0.0058
--- Epoch 111 / 2000 - 111 epochs total
Iteration 0, loss = 0.0077
Iteration 20, loss = 0.0091
Iteration 40, loss = 0.0031
Iteration 60, loss = 0.0305
Iteration 80, loss = 0.0321
--- Epoch 112 / 2000 - 112 epochs total
Iteration 0, loss = 0.0105
Iteration 20, loss = 0.0087
Iteration 40, loss = 0.0044
Iteration 60, loss = 0.0038
Iteration 80, loss = 0.0044
--- Epoch 113 / 2000 - 113 epochs total
Iteration 0, loss = 0.0052
Iteration 20, loss = 0.0048
Iteration 40, loss = 0.0063
Iteration 60, loss = 0.0088
Iteration 80, loss = 0.0095
--- Epoch 114 / 2000 - 114 epochs total
Iteration 0, loss = 0.0095
Iteration 20, loss = 0.0122
Iteration 40, loss = 0.0068
Iteration 60, loss = 0.0109
Iteration 80, loss = 0.0121
--- Epoch 115 / 2000 - 115 epochs total
Iteration 0, loss = 0.0067
Iteration 20, loss = 0.0191
Iteration 40, loss = 0.0125
Iteration 60, loss = 0.0049
Iteration 80, loss = 0.0027
--- Epoch 116 / 2000 - 116 epochs total
Iteration 0, loss = 0.0372
Iteration 20, loss = 0.0066
Iteration 40, loss = 0.0120
Iteration 60, loss = 0.0031
Iteration 80, loss = 0.0109
--- Epoch 117 / 2000 - 117 epochs total
Iteration 0, loss = 0.0019
Iteration 20, loss = 0.0024
Iteration 40, loss = 0.0117
Iteration 60, loss = 0.0024
Iteration 80, loss = 0.0041
--- Epoch 118 / 2000 - 118 epochs total
Iteration 0, loss = 0.0110
Iteration 20, loss = 0.0118
Iteration 40, loss = 0.0127
Iteration 60, loss = 0.0092
Iteration 80, loss = 0.0029
--- Epoch 119 / 2000 - 119 epochs total
Iteration 0, loss = 0.0051
Iteration 20, loss = 0.0243
Iteration 40, loss = 0.0120
Iteration 60, loss = 0.0115
Iteration 80, loss = 0.0041
--- Epoch 120 / 2000 - 120 epochs total
Iteration 0, loss = 0.0162
Iteration 20, loss = 0.0154
Iteration 40, loss = 0.0104
Iteration 60, loss = 0.0071
Iteration 80, loss = 0.0131
--- Epoch 121 / 2000 - 121 epochs total
Iteration 0, loss = 0.0078
Iteration 20, loss = 0.0437
Iteration 40, loss = 0.0037
Iteration 60, loss = 0.0079
Iteration 80, loss = 0.0088
--- Epoch 122 / 2000 - 122 epochs total
Iteration 0, loss = 0.0084
Iteration 20, loss = 0.0067
Iteration 40, loss = 0.0080
Iteration 60, loss = 0.0055
Iteration 80, loss = 0.0282
--- Epoch 123 / 2000 - 123 epochs total
Iteration 0, loss = 0.0036
Iteration 20, loss = 0.0145
Iteration 40, loss = 0.0025
Iteration 60, loss = 0.0166
Iteration 80, loss = 0.0129
--- Epoch 124 / 2000 - 124 epochs total
Iteration 0, loss = 0.0043
Iteration 20, loss = 0.0232
Iteration 40, loss = 0.0082
Iteration 60, loss = 0.0292
Iteration 80, loss = 0.0126
--- Epoch 125 / 2000 - 125 epochs total
Iteration 0, loss = 0.0266
Iteration 20, loss = 0.0246
Iteration 40, loss = 0.0058
Iteration 60, loss = 0.0075
Iteration 80, loss = 0.0014
--- Epoch 126 / 2000 - 126 epochs total
Iteration 0, loss = 0.0054
Iteration 20, loss = 0.0035
Iteration 40, loss = 0.0092
Iteration 60, loss = 0.0080
Iteration 80, loss = 0.0087
--- Epoch 127 / 2000 - 127 epochs total
Iteration 0, loss = 0.0067
Iteration 20, loss = 0.0020
Iteration 40, loss = 0.0087
Iteration 60, loss = 0.0064
Iteration 80, loss = 0.0328
--- Epoch 128 / 2000 - 128 epochs total
Iteration 0, loss = 0.0093
Iteration 20, loss = 0.0060
Iteration 40, loss = 0.0080
Iteration 60, loss = 0.0056
Iteration 80, loss = 0.0015
--- Epoch 129 / 2000 - 129 epochs total
Iteration 0, loss = 0.0078
Iteration 20, loss = 0.0098
Iteration 40, loss = 0.0045
Iteration 60, loss = 0.0036
Iteration 80, loss = 0.0144
--- Epoch 130 / 2000 - 130 epochs total
Iteration 0, loss = 0.0086
Iteration 20, loss = 0.0057
Iteration 40, loss = 0.0030
Iteration 60, loss = 0.0077
Iteration 80, loss = 0.0022
--- Epoch 131 / 2000 - 131 epochs total
Iteration 0, loss = 0.0020
Iteration 20, loss = 0.0041
Iteration 40, loss = 0.0059
Iteration 60, loss = 0.0022
Iteration 80, loss = 0.0035
--- Epoch 132 / 2000 - 132 epochs total
Iteration 0, loss = 0.0025
Iteration 20, loss = 0.0126
Iteration 40, loss = 0.0121
Iteration 60, loss = 0.0010
Iteration 80, loss = 0.0054
--- Epoch 133 / 2000 - 133 epochs total
Iteration 0, loss = 0.0043
Iteration 20, loss = 0.0151
Iteration 40, loss = 0.0022
Iteration 60, loss = 0.0020
Iteration 80, loss = 0.0111
--- Epoch 134 / 2000 - 134 epochs total
Iteration 0, loss = 0.0075
Iteration 20, loss = 0.0097
Iteration 40, loss = 0.0071
Iteration 60, loss = 0.0037
Iteration 80, loss = 0.0050
--- Epoch 135 / 2000 - 135 epochs total
Iteration 0, loss = 0.0062
Iteration 20, loss = 0.0147
Iteration 40, loss = 0.0076
Iteration 60, loss = 0.0244
Iteration 80, loss = 0.0012
--- Epoch 136 / 2000 - 136 epochs total
Iteration 0, loss = 0.0030
Iteration 20, loss = 0.0021
Iteration 40, loss = 0.0074
Iteration 60, loss = 0.0117
Iteration 80, loss = 0.0038
--- Epoch 137 / 2000 - 137 epochs total
Iteration 0, loss = 0.0041
Iteration 20, loss = 0.0158
Iteration 40, loss = 0.0090
Iteration 60, loss = 0.0038
Iteration 80, loss = 0.0030
--- Epoch 138 / 2000 - 138 epochs total
Iteration 0, loss = 0.0115
Iteration 20, loss = 0.0100
Iteration 40, loss = 0.0141
Iteration 60, loss = 0.0066
Iteration 80, loss = 0.0046
--- Epoch 139 / 2000 - 139 epochs total
Iteration 0, loss = 0.0028
Iteration 20, loss = 0.0108
Iteration 40, loss = 0.0074
Iteration 60, loss = 0.0022
Iteration 80, loss = 0.0020
--- Epoch 140 / 2000 - 140 epochs total
Iteration 0, loss = 0.0022
Iteration 20, loss = 0.0082
Iteration 40, loss = 0.0074
Iteration 60, loss = 0.0028
Iteration 80, loss = 0.0020
--- Epoch 141 / 2000 - 141 epochs total
Iteration 0, loss = 0.0151
Iteration 20, loss = 0.0017
Iteration 40, loss = 0.0036
Iteration 60, loss = 0.0076
Iteration 80, loss = 0.0057
--- Epoch 142 / 2000 - 142 epochs total
Iteration 0, loss = 0.0112
Iteration 20, loss = 0.0024
Iteration 40, loss = 0.0167
Iteration 60, loss = 0.0030
Iteration 80, loss = 0.0096
--- Epoch 143 / 2000 - 143 epochs total
Iteration 0, loss = 0.0063
Iteration 20, loss = 0.0076
Iteration 40, loss = 0.0022
Iteration 60, loss = 0.0074
Iteration 80, loss = 0.0031
--- Epoch 144 / 2000 - 144 epochs total
Iteration 0, loss = 0.0203
Iteration 20, loss = 0.0069
Iteration 40, loss = 0.0070
Iteration 60, loss = 0.0058
Iteration 80, loss = 0.0025
--- Epoch 145 / 2000 - 145 epochs total
Iteration 0, loss = 0.0021
Iteration 20, loss = 0.0029
Iteration 40, loss = 0.0215
Iteration 60, loss = 0.0015
Iteration 80, loss = 0.0049
--- Epoch 146 / 2000 - 146 epochs total
Iteration 0, loss = 0.0076
Iteration 20, loss = 0.0167
Iteration 40, loss = 0.0037
Iteration 60, loss = 0.0065
Iteration 80, loss = 0.0014
--- Epoch 147 / 2000 - 147 epochs total
Iteration 0, loss = 0.0089
Iteration 20, loss = 0.0130
Iteration 40, loss = 0.0108
Iteration 60, loss = 0.0048
Iteration 80, loss = 0.0142
--- Epoch 148 / 2000 - 148 epochs total
Iteration 0, loss = 0.0282
Iteration 20, loss = 0.0027
Iteration 40, loss = 0.0017
Iteration 60, loss = 0.0140
Iteration 80, loss = 0.0082
--- Epoch 149 / 2000 - 149 epochs total
Iteration 0, loss = 0.0071
Iteration 20, loss = 0.0052
Iteration 40, loss = 0.0059
Iteration 60, loss = 0.0068
Iteration 80, loss = 0.0033
--- Epoch 150 / 2000 - 150 epochs total
Iteration 0, loss = 0.0227
Iteration 20, loss = 0.0038
Iteration 40, loss = 0.0117
Iteration 60, loss = 0.0069
Iteration 80, loss = 0.0014
--- Epoch 151 / 2000 - 151 epochs total
Iteration 0, loss = 0.0019
Iteration 20, loss = 0.0136
Iteration 40, loss = 0.0652
Iteration 60, loss = 0.0051
Iteration 80, loss = 0.0056
--- Epoch 152 / 2000 - 152 epochs total
Iteration 0, loss = 0.0038
Iteration 20, loss = 0.0068
Iteration 40, loss = 0.0182
Iteration 60, loss = 0.0040
Iteration 80, loss = 0.0088
--- Epoch 153 / 2000 - 153 epochs total
Iteration 0, loss = 0.0056
Iteration 20, loss = 0.0205
Iteration 40, loss = 0.0087
Iteration 60, loss = 0.0254
Iteration 80, loss = 0.0312
--- Epoch 154 / 2000 - 154 epochs total
Iteration 0, loss = 0.0022
Iteration 20, loss = 0.0034
Iteration 40, loss = 0.0087
Iteration 60, loss = 0.0064
Iteration 80, loss = 0.0051
--- Epoch 155 / 2000 - 155 epochs total
Iteration 0, loss = 0.0169
Iteration 20, loss = 0.0095
Iteration 40, loss = 0.0034
Iteration 60, loss = 0.0031
Iteration 80, loss = 0.0093
--- Epoch 156 / 2000 - 156 epochs total
Iteration 0, loss = 0.0023
Iteration 20, loss = 0.0009
Iteration 40, loss = 0.0082
Iteration 60, loss = 0.0011
Iteration 80, loss = 0.0117
--- Epoch 157 / 2000 - 157 epochs total
Iteration 0, loss = 0.0019
Iteration 20, loss = 0.0143
Iteration 40, loss = 0.0048
Iteration 60, loss = 0.0035
Iteration 80, loss = 0.0034
--- Epoch 158 / 2000 - 158 epochs total
Iteration 0, loss = 0.0099
Iteration 20, loss = 0.0023
Iteration 40, loss = 0.0083
Iteration 60, loss = 0.0146
Iteration 80, loss = 0.0060
--- Epoch 159 / 2000 - 159 epochs total
Iteration 0, loss = 0.0023
Iteration 20, loss = 0.0095
Iteration 40, loss = 0.0325
Iteration 60, loss = 0.0049
Iteration 80, loss = 0.0030
--- Epoch 160 / 2000 - 160 epochs total
Iteration 0, loss = 0.0057
Iteration 20, loss = 0.0013
Iteration 40, loss = 0.0062
Iteration 60, loss = 0.0023
Iteration 80, loss = 0.0047
--- Epoch 161 / 2000 - 161 epochs total
Iteration 0, loss = 0.0095
Iteration 20, loss = 0.0067
Iteration 40, loss = 0.0103
Iteration 60, loss = 0.0015
Iteration 80, loss = 0.0189
--- Epoch 162 / 2000 - 162 epochs total
Iteration 0, loss = 0.0124
Iteration 20, loss = 0.0149
Iteration 40, loss = 0.0049
Iteration 60, loss = 0.0069
Iteration 80, loss = 0.0119
--- Epoch 163 / 2000 - 163 epochs total
Iteration 0, loss = 0.0136
Iteration 20, loss = 0.0082
Iteration 40, loss = 0.0063
Iteration 60, loss = 0.0016
Iteration 80, loss = 0.0034
--- Epoch 164 / 2000 - 164 epochs total
Iteration 0, loss = 0.0055
Iteration 20, loss = 0.0071
Iteration 40, loss = 0.0047
Iteration 60, loss = 0.0088
Iteration 80, loss = 0.0091
--- Epoch 165 / 2000 - 165 epochs total
Iteration 0, loss = 0.0010
Iteration 20, loss = 0.0044
Iteration 40, loss = 0.0394
Iteration 60, loss = 0.0038
Iteration 80, loss = 0.0294
--- Epoch 166 / 2000 - 166 epochs total
Iteration 0, loss = 0.0340
Iteration 20, loss = 0.0113
Iteration 40, loss = 0.0189
Iteration 60, loss = 0.0174
Iteration 80, loss = 0.0036
--- Epoch 167 / 2000 - 167 epochs total
Iteration 0, loss = 0.0048
Iteration 20, loss = 0.0203
Iteration 40, loss = 0.0139
Iteration 60, loss = 0.0022
Iteration 80, loss = 0.0217
--- Epoch 168 / 2000 - 168 epochs total
Iteration 0, loss = 0.0074
Iteration 20, loss = 0.0058
Iteration 40, loss = 0.0022
Iteration 60, loss = 0.0019
Iteration 80, loss = 0.0046
--- Epoch 169 / 2000 - 169 epochs total
Iteration 0, loss = 0.0034
Iteration 20, loss = 0.0045
Iteration 40, loss = 0.0040
Iteration 60, loss = 0.0045
Iteration 80, loss = 0.0231
--- Epoch 170 / 2000 - 170 epochs total
Iteration 0, loss = 0.0029
Iteration 20, loss = 0.0059
Iteration 40, loss = 0.0114
Iteration 60, loss = 0.0165
Iteration 80, loss = 0.0018
--- Epoch 171 / 2000 - 171 epochs total
Iteration 0, loss = 0.0164
Iteration 20, loss = 0.0182
Iteration 40, loss = 0.0053
Iteration 60, loss = 0.0150
Iteration 80, loss = 0.0143
--- Epoch 172 / 2000 - 172 epochs total
Iteration 0, loss = 0.0072
Iteration 20, loss = 0.0088
Iteration 40, loss = 0.0103
Iteration 60, loss = 0.0237
Iteration 80, loss = 0.0095
--- Epoch 173 / 2000 - 173 epochs total
Iteration 0, loss = 0.0399
Iteration 20, loss = 0.0036
Iteration 40, loss = 0.0011
Iteration 60, loss = 0.0027
Iteration 80, loss = 0.0055
--- Epoch 174 / 2000 - 174 epochs total
Iteration 0, loss = 0.0067
Iteration 20, loss = 0.0066
Iteration 40, loss = 0.0084
Iteration 60, loss = 0.0138
Iteration 80, loss = 0.0045
--- Epoch 175 / 2000 - 175 epochs total
Iteration 0, loss = 0.0051
Iteration 20, loss = 0.0048
Iteration 40, loss = 0.0015
Iteration 60, loss = 0.0023
Iteration 80, loss = 0.0247
--- Epoch 176 / 2000 - 176 epochs total
Iteration 0, loss = 0.0059
Iteration 20, loss = 0.0042
Iteration 40, loss = 0.0076
Iteration 60, loss = 0.0020
Iteration 80, loss = 0.0041
--- Epoch 177 / 2000 - 177 epochs total
Iteration 0, loss = 0.0181
Iteration 20, loss = 0.0037
Iteration 40, loss = 0.0044
Iteration 60, loss = 0.0112
Iteration 80, loss = 0.0025
--- Epoch 178 / 2000 - 178 epochs total
Iteration 0, loss = 0.0046
Iteration 20, loss = 0.0060
Iteration 40, loss = 0.0096
Iteration 60, loss = 0.0067
Iteration 80, loss = 0.0042
--- Epoch 179 / 2000 - 179 epochs total
Iteration 0, loss = 0.0111
Iteration 20, loss = 0.0018
Iteration 40, loss = 0.0029
Iteration 60, loss = 0.0049
Iteration 80, loss = 0.0316
--- Epoch 180 / 2000 - 180 epochs total
Iteration 0, loss = 0.0033
Iteration 20, loss = 0.0075
Iteration 40, loss = 0.0019
Iteration 60, loss = 0.0036
Iteration 80, loss = 0.0037
--- Epoch 181 / 2000 - 181 epochs total
Iteration 0, loss = 0.0012
Iteration 20, loss = 0.0031
Iteration 40, loss = 0.0185
Iteration 60, loss = 0.0031
Iteration 80, loss = 0.0023
--- Epoch 182 / 2000 - 182 epochs total
Iteration 0, loss = 0.0045
Iteration 20, loss = 0.0038
Iteration 40, loss = 0.0020
Iteration 60, loss = 0.0024
Iteration 80, loss = 0.0092
--- Epoch 183 / 2000 - 183 epochs total
Iteration 0, loss = 0.0114
Iteration 20, loss = 0.0020
Iteration 40, loss = 0.0035
Iteration 60, loss = 0.0092
Iteration 80, loss = 0.0112
--- Epoch 184 / 2000 - 184 epochs total
Iteration 0, loss = 0.0053
Iteration 20, loss = 0.0021
Iteration 40, loss = 0.0032
Iteration 60, loss = 0.0013
Iteration 80, loss = 0.0062
--- Epoch 185 / 2000 - 185 epochs total
Iteration 0, loss = 0.0125
Iteration 20, loss = 0.0068
Iteration 40, loss = 0.0055
Iteration 60, loss = 0.0044
Iteration 80, loss = 0.0046
--- Epoch 186 / 2000 - 186 epochs total
Iteration 0, loss = 0.0108
Iteration 20, loss = 0.0050
Iteration 40, loss = 0.0149
Iteration 60, loss = 0.0325
Iteration 80, loss = 0.0009
--- Epoch 187 / 2000 - 187 epochs total
Iteration 0, loss = 0.0070
Iteration 20, loss = 0.0038
Iteration 40, loss = 0.0063
Iteration 60, loss = 0.0100
Iteration 80, loss = 0.0046
--- Epoch 188 / 2000 - 188 epochs total
Iteration 0, loss = 0.0013
Iteration 20, loss = 0.0069
Iteration 40, loss = 0.0024
Iteration 60, loss = 0.0320
Iteration 80, loss = 0.0042
--- Epoch 189 / 2000 - 189 epochs total
Iteration 0, loss = 0.0077
Iteration 20, loss = 0.0012
Iteration 40, loss = 0.0152
Iteration 60, loss = 0.0055
Iteration 80, loss = 0.0023
--- Epoch 190 / 2000 - 190 epochs total
Iteration 0, loss = 0.0118
Iteration 20, loss = 0.0151
Iteration 40, loss = 0.0109
Iteration 60, loss = 0.0158
Iteration 80, loss = 0.0042
--- Epoch 191 / 2000 - 191 epochs total
Iteration 0, loss = 0.0053
Iteration 20, loss = 0.0139
Iteration 40, loss = 0.0182
Iteration 60, loss = 0.0100
Iteration 80, loss = 0.0053
--- Epoch 192 / 2000 - 192 epochs total
Iteration 0, loss = 0.0200
Iteration 20, loss = 0.0069
Iteration 40, loss = 0.0069
Iteration 60, loss = 0.0035
Iteration 80, loss = 0.0119
--- Epoch 193 / 2000 - 193 epochs total
Iteration 0, loss = 0.0030
Iteration 20, loss = 0.0245
Iteration 40, loss = 0.0043
Iteration 60, loss = 0.0052
Iteration 80, loss = 0.0019
--- Epoch 194 / 2000 - 194 epochs total
Iteration 0, loss = 0.0075
Iteration 20, loss = 0.0100
Iteration 40, loss = 0.0025
Iteration 60, loss = 0.0062
Iteration 80, loss = 0.0026
--- Epoch 195 / 2000 - 195 epochs total
Iteration 0, loss = 0.0033
Iteration 20, loss = 0.0040
Iteration 40, loss = 0.0093
Iteration 60, loss = 0.0039
Iteration 80, loss = 0.0042
--- Epoch 196 / 2000 - 196 epochs total
Iteration 0, loss = 0.0036
Iteration 20, loss = 0.0073
Iteration 40, loss = 0.0032
Iteration 60, loss = 0.0169
Iteration 80, loss = 0.0418
--- Epoch 197 / 2000 - 197 epochs total
Iteration 0, loss = 0.0036
Iteration 20, loss = 0.0051
Iteration 40, loss = 0.0064
Iteration 60, loss = 0.0099
Iteration 80, loss = 0.0036
--- Epoch 198 / 2000 - 198 epochs total
Iteration 0, loss = 0.0093
Iteration 20, loss = 0.0026
Iteration 40, loss = 0.0101
Iteration 60, loss = 0.0043
Iteration 80, loss = 0.0128
--- Epoch 199 / 2000 - 199 epochs total
Iteration 0, loss = 0.0221
Iteration 20, loss = 0.0028
Iteration 40, loss = 0.0047
Iteration 60, loss = 0.0032
Iteration 80, loss = 0.0050
--- Epoch 200 / 2000 - 200 epochs total
Iteration 0, loss = 0.0055
Iteration 20, loss = 0.0059
Iteration 40, loss = 0.0144
Iteration 60, loss = 0.0023
Iteration 80, loss = 0.0020
--- Epoch 201 / 2000 - 201 epochs total
Iteration 0, loss = 0.0032
Iteration 20, loss = 0.0052
Iteration 40, loss = 0.0127
Iteration 60, loss = 0.0052
Iteration 80, loss = 0.0138
--- Epoch 202 / 2000 - 202 epochs total
Iteration 0, loss = 0.0049
Iteration 20, loss = 0.0074
Iteration 40, loss = 0.0058
Iteration 60, loss = 0.0266
Iteration 80, loss = 0.0028
--- Epoch 203 / 2000 - 203 epochs total
Iteration 0, loss = 0.0085
Iteration 20, loss = 0.0048
Iteration 40, loss = 0.0226
Iteration 60, loss = 0.0062
Iteration 80, loss = 0.0169
--- Epoch 204 / 2000 - 204 epochs total
Iteration 0, loss = 0.0035
Iteration 20, loss = 0.0051
Iteration 40, loss = 0.0019
Iteration 60, loss = 0.0124
Iteration 80, loss = 0.0018
--- Epoch 205 / 2000 - 205 epochs total
Iteration 0, loss = 0.0013
Iteration 20, loss = 0.0029
Iteration 40, loss = 0.0096
Iteration 60, loss = 0.0017
Iteration 80, loss = 0.0031
--- Epoch 206 / 2000 - 206 epochs total
Iteration 0, loss = 0.0022
Iteration 20, loss = 0.0022
Iteration 40, loss = 0.0023
Iteration 60, loss = 0.0017
Iteration 80, loss = 0.0059
--- Epoch 207 / 2000 - 207 epochs total
Iteration 0, loss = 0.0024
Iteration 20, loss = 0.0390
Iteration 40, loss = 0.0041
Iteration 60, loss = 0.0021
Iteration 80, loss = 0.0049
--- Epoch 208 / 2000 - 208 epochs total
Iteration 0, loss = 0.0131
Iteration 20, loss = 0.0151
Iteration 40, loss = 0.0043
Iteration 60, loss = 0.0025
Iteration 80, loss = 0.0021
--- Epoch 209 / 2000 - 209 epochs total
Iteration 0, loss = 0.0101
Iteration 20, loss = 0.0027
Iteration 40, loss = 0.0017
Iteration 60, loss = 0.0095
Iteration 80, loss = 0.0046
--- Epoch 210 / 2000 - 210 epochs total
Iteration 0, loss = 0.0061
Iteration 20, loss = 0.0180
Iteration 40, loss = 0.0055
Iteration 60, loss = 0.0050
Iteration 80, loss = 0.0121
--- Epoch 211 / 2000 - 211 epochs total
Iteration 0, loss = 0.0060
Iteration 20, loss = 0.0062
Iteration 40, loss = 0.0083
Iteration 60, loss = 0.0047
Iteration 80, loss = 0.0021
--- Epoch 212 / 2000 - 212 epochs total
Iteration 0, loss = 0.0124
Iteration 20, loss = 0.0075
Iteration 40, loss = 0.0022
Iteration 60, loss = 0.0017
Iteration 80, loss = 0.0070
--- Epoch 213 / 2000 - 213 epochs total
Iteration 0, loss = 0.0080
Iteration 20, loss = 0.0047
Iteration 40, loss = 0.0015
Iteration 60, loss = 0.0031
Iteration 80, loss = 0.0102
--- Epoch 214 / 2000 - 214 epochs total
Iteration 0, loss = 0.0065
Iteration 20, loss = 0.0345
Iteration 40, loss = 0.0155
Iteration 60, loss = 0.0069
Iteration 80, loss = 0.0027
--- Epoch 215 / 2000 - 215 epochs total
Iteration 0, loss = 0.0031
Iteration 20, loss = 0.0116
Iteration 40, loss = 0.0103
Iteration 60, loss = 0.0176
Iteration 80, loss = 0.0087
--- Epoch 216 / 2000 - 216 epochs total
Iteration 0, loss = 0.0133
Iteration 20, loss = 0.0277
Iteration 40, loss = 0.0016
Iteration 60, loss = 0.0065
Iteration 80, loss = 0.0053
--- Epoch 217 / 2000 - 217 epochs total
Iteration 0, loss = 0.0084
Iteration 20, loss = 0.0016
Iteration 40, loss = 0.0031
Iteration 60, loss = 0.0050
Iteration 80, loss = 0.0052
--- Epoch 218 / 2000 - 218 epochs total
Iteration 0, loss = 0.0360
Iteration 20, loss = 0.0031
Iteration 40, loss = 0.0057
Iteration 60, loss = 0.0050
Iteration 80, loss = 0.0035
--- Epoch 219 / 2000 - 219 epochs total
Iteration 0, loss = 0.0054
Iteration 20, loss = 0.0042
Iteration 40, loss = 0.0191
Iteration 60, loss = 0.0116
Iteration 80, loss = 0.0045
--- Epoch 220 / 2000 - 220 epochs total
Iteration 0, loss = 0.0018
Iteration 20, loss = 0.0016
Iteration 40, loss = 0.0074
Iteration 60, loss = 0.0013
Iteration 80, loss = 0.0020
--- Epoch 221 / 2000 - 221 epochs total
Iteration 0, loss = 0.0028
Iteration 20, loss = 0.0031
Iteration 40, loss = 0.0065
Iteration 60, loss = 0.0069
Iteration 80, loss = 0.0018
--- Epoch 222 / 2000 - 222 epochs total
Iteration 0, loss = 0.0086
Iteration 20, loss = 0.0123
Iteration 40, loss = 0.0079
Iteration 60, loss = 0.0019
Iteration 80, loss = 0.0069
--- Epoch 223 / 2000 - 223 epochs total
Iteration 0, loss = 0.0087
Iteration 20, loss = 0.0050
Iteration 40, loss = 0.0070
Iteration 60, loss = 0.0067
Iteration 80, loss = 0.0048
--- Epoch 224 / 2000 - 224 epochs total
Iteration 0, loss = 0.0051
Iteration 20, loss = 0.0080
Iteration 40, loss = 0.0039
Iteration 60, loss = 0.0056
Iteration 80, loss = 0.0051
--- Epoch 225 / 2000 - 225 epochs total
Iteration 0, loss = 0.0033
Iteration 20, loss = 0.0012
Iteration 40, loss = 0.0021
Iteration 60, loss = 0.0077
Iteration 80, loss = 0.0017
--- Epoch 226 / 2000 - 226 epochs total
Iteration 0, loss = 0.0048
Iteration 20, loss = 0.0019
Iteration 40, loss = 0.0124
Iteration 60, loss = 0.0022
Iteration 80, loss = 0.0077
--- Epoch 227 / 2000 - 227 epochs total
Iteration 0, loss = 0.0024
Iteration 20, loss = 0.0061
Iteration 40, loss = 0.0036
Iteration 60, loss = 0.0072
Iteration 80, loss = 0.0052
--- Epoch 228 / 2000 - 228 epochs total
Iteration 0, loss = 0.0213
Iteration 20, loss = 0.0044
Iteration 40, loss = 0.0078
Iteration 60, loss = 0.0013
Iteration 80, loss = 0.0060
--- Epoch 229 / 2000 - 229 epochs total
Iteration 0, loss = 0.0048
Iteration 20, loss = 0.0046
Iteration 40, loss = 0.0052
Iteration 60, loss = 0.0041
Iteration 80, loss = 0.0059
--- Epoch 230 / 2000 - 230 epochs total
Iteration 0, loss = 0.0015
Iteration 20, loss = 0.0116
Iteration 40, loss = 0.0056
Iteration 60, loss = 0.0072
Iteration 80, loss = 0.0099
--- Epoch 231 / 2000 - 231 epochs total
Iteration 0, loss = 0.0038
Iteration 20, loss = 0.0047
Iteration 40, loss = 0.0477
Iteration 60, loss = 0.0045
Iteration 80, loss = 0.0081
--- Epoch 232 / 2000 - 232 epochs total
Iteration 0, loss = 0.0021
Iteration 20, loss = 0.0033
Iteration 40, loss = 0.0093
Iteration 60, loss = 0.0019
Iteration 80, loss = 0.0062
--- Epoch 233 / 2000 - 233 epochs total
Iteration 0, loss = 0.0078
Iteration 20, loss = 0.0053
Iteration 40, loss = 0.0030
Iteration 60, loss = 0.0042
Iteration 80, loss = 0.0047
--- Epoch 234 / 2000 - 234 epochs total
Iteration 0, loss = 0.0187
Iteration 20, loss = 0.0021
Iteration 40, loss = 0.0040
Iteration 60, loss = 0.0087
Iteration 80, loss = 0.0051
--- Epoch 235 / 2000 - 235 epochs total
Iteration 0, loss = 0.0046
Iteration 20, loss = 0.0104
Iteration 40, loss = 0.0049
Iteration 60, loss = 0.0050
Iteration 80, loss = 0.0062
--- Epoch 236 / 2000 - 236 epochs total
Iteration 0, loss = 0.0113
Iteration 20, loss = 0.0038
Iteration 40, loss = 0.0147
Iteration 60, loss = 0.0094
Iteration 80, loss = 0.0023
--- Epoch 237 / 2000 - 237 epochs total
Iteration 0, loss = 0.0237
Iteration 20, loss = 0.0037
Iteration 40, loss = 0.0025
Iteration 60, loss = 0.0028
Iteration 80, loss = 0.0065
--- Epoch 238 / 2000 - 238 epochs total
Iteration 0, loss = 0.0054
Iteration 20, loss = 0.0143
Iteration 40, loss = 0.0035
Iteration 60, loss = 0.0032
Iteration 80, loss = 0.0039
--- Epoch 239 / 2000 - 239 epochs total
Iteration 0, loss = 0.0050
Iteration 20, loss = 0.0040
Iteration 40, loss = 0.0106
Iteration 60, loss = 0.0280
Iteration 80, loss = 0.0061
--- Epoch 240 / 2000 - 240 epochs total
Iteration 0, loss = 0.0036
Iteration 20, loss = 0.0050
Iteration 40, loss = 0.0035
Iteration 60, loss = 0.0032
Iteration 80, loss = 0.0025
--- Epoch 241 / 2000 - 241 epochs total
Iteration 0, loss = 0.0059
Iteration 20, loss = 0.0032
Iteration 40, loss = 0.0091
Iteration 60, loss = 0.0034
Iteration 80, loss = 0.0051
--- Epoch 242 / 2000 - 242 epochs total
Iteration 0, loss = 0.0021
Iteration 20, loss = 0.0217
Iteration 40, loss = 0.0033
Iteration 60, loss = 0.0038
Iteration 80, loss = 0.0034
--- Epoch 243 / 2000 - 243 epochs total
Iteration 0, loss = 0.0017
Iteration 20, loss = 0.0079
Iteration 40, loss = 0.0048
Iteration 60, loss = 0.0046
Iteration 80, loss = 0.0065
--- Epoch 244 / 2000 - 244 epochs total
Iteration 0, loss = 0.0050
Iteration 20, loss = 0.0038
Iteration 40, loss = 0.0097
Iteration 60, loss = 0.0019
Iteration 80, loss = 0.0089
--- Epoch 245 / 2000 - 245 epochs total
Iteration 0, loss = 0.0093
Iteration 20, loss = 0.0029
Iteration 40, loss = 0.0034
Iteration 60, loss = 0.0058
Iteration 80, loss = 0.0025
--- Epoch 246 / 2000 - 246 epochs total
Iteration 0, loss = 0.0060
Iteration 20, loss = 0.0049
Iteration 40, loss = 0.0039
Iteration 60, loss = 0.0039
Iteration 80, loss = 0.0070
--- Epoch 247 / 2000 - 247 epochs total
Iteration 0, loss = 0.0019
Iteration 20, loss = 0.0026
Iteration 40, loss = 0.0116
Iteration 60, loss = 0.0014
Iteration 80, loss = 0.0118
--- Epoch 248 / 2000 - 248 epochs total
Iteration 0, loss = 0.0124
Iteration 20, loss = 0.0033
Iteration 40, loss = 0.0061
Iteration 60, loss = 0.0036
Iteration 80, loss = 0.0061
--- Epoch 249 / 2000 - 249 epochs total
Iteration 0, loss = 0.0059
Iteration 20, loss = 0.0023
Iteration 40, loss = 0.0057
Iteration 60, loss = 0.0054
Iteration 80, loss = 0.0024
--- Epoch 250 / 2000 - 250 epochs total
Iteration 0, loss = 0.0093
Iteration 20, loss = 0.0074
Iteration 40, loss = 0.0054
Iteration 60, loss = 0.0018
Iteration 80, loss = 0.0165
--- Epoch 251 / 2000 - 251 epochs total
Iteration 0, loss = 0.0018
Iteration 20, loss = 0.0026
Iteration 40, loss = 0.0024
Iteration 60, loss = 0.0153
Iteration 80, loss = 0.0070
--- Epoch 252 / 2000 - 252 epochs total
Iteration 0, loss = 0.0038
Iteration 20, loss = 0.0076
Iteration 40, loss = 0.0021
Iteration 60, loss = 0.0086
Iteration 80, loss = 0.0058
--- Epoch 253 / 2000 - 253 epochs total
Iteration 0, loss = 0.0073
Iteration 20, loss = 0.0022
Iteration 40, loss = 0.0014
Iteration 60, loss = 0.0089
Iteration 80, loss = 0.0049
--- Epoch 254 / 2000 - 254 epochs total
Iteration 0, loss = 0.0022
Iteration 20, loss = 0.0040
Iteration 40, loss = 0.0326
Iteration 60, loss = 0.0132
Iteration 80, loss = 0.0076
--- Epoch 255 / 2000 - 255 epochs total
Iteration 0, loss = 0.0026
Iteration 20, loss = 0.0038
Iteration 40, loss = 0.0029
Iteration 60, loss = 0.0103
Iteration 80, loss = 0.0032
--- Epoch 256 / 2000 - 256 epochs total
Iteration 0, loss = 0.0102
Iteration 20, loss = 0.0121
Iteration 40, loss = 0.0023
Iteration 60, loss = 0.0044
Iteration 80, loss = 0.0184
--- Epoch 257 / 2000 - 257 epochs total
Iteration 0, loss = 0.0046
Iteration 20, loss = 0.0015
Iteration 40, loss = 0.0034
Iteration 60, loss = 0.0062
Iteration 80, loss = 0.0042
--- Epoch 258 / 2000 - 258 epochs total
Iteration 0, loss = 0.0069
Iteration 20, loss = 0.0032
Iteration 40, loss = 0.0062
Iteration 60, loss = 0.0022
Iteration 80, loss = 0.0071
--- Epoch 259 / 2000 - 259 epochs total
Iteration 0, loss = 0.0048
Iteration 20, loss = 0.0102
Iteration 40, loss = 0.0190
Iteration 60, loss = 0.0087
Iteration 80, loss = 0.0062
--- Epoch 260 / 2000 - 260 epochs total
Iteration 0, loss = 0.0030
Iteration 20, loss = 0.0087
Iteration 40, loss = 0.0018
Iteration 60, loss = 0.0048
Iteration 80, loss = 0.0097
--- Epoch 261 / 2000 - 261 epochs total
Iteration 0, loss = 0.0064
Iteration 20, loss = 0.0029
Iteration 40, loss = 0.0047
Iteration 60, loss = 0.0071
Iteration 80, loss = 0.0073
--- Epoch 262 / 2000 - 262 epochs total
Iteration 0, loss = 0.0060
Iteration 20, loss = 0.0031
Iteration 40, loss = 0.0048
Iteration 60, loss = 0.0025
Iteration 80, loss = 0.0041
--- Epoch 263 / 2000 - 263 epochs total
Iteration 0, loss = 0.0033
Iteration 20, loss = 0.0221
Iteration 40, loss = 0.0038
Iteration 60, loss = 0.0029
Iteration 80, loss = 0.0036
--- Epoch 264 / 2000 - 264 epochs total
Iteration 0, loss = 0.0022
Iteration 20, loss = 0.0081
Iteration 40, loss = 0.0036
Iteration 60, loss = 0.0031
Iteration 80, loss = 0.0026
--- Epoch 265 / 2000 - 265 epochs total
Iteration 0, loss = 0.0020
Iteration 20, loss = 0.0068
Iteration 40, loss = 0.0009
Iteration 60, loss = 0.0027
Iteration 80, loss = 0.0099
--- Epoch 266 / 2000 - 266 epochs total
Iteration 0, loss = 0.0071
Iteration 20, loss = 0.0089
Iteration 40, loss = 0.0176
Iteration 60, loss = 0.0042
Iteration 80, loss = 0.0091
--- Epoch 267 / 2000 - 267 epochs total
Iteration 0, loss = 0.0088
Iteration 20, loss = 0.0134
Iteration 40, loss = 0.0054
Iteration 60, loss = 0.0081
Iteration 80, loss = 0.0129
--- Epoch 268 / 2000 - 268 epochs total
Iteration 0, loss = 0.0185
Iteration 20, loss = 0.0122
Iteration 40, loss = 0.0033
Iteration 60, loss = 0.0067
Iteration 80, loss = 0.0103
--- Epoch 269 / 2000 - 269 epochs total
Iteration 0, loss = 0.0020
Iteration 20, loss = 0.0109
Iteration 40, loss = 0.0142
Iteration 60, loss = 0.0134
Iteration 80, loss = 0.0060
--- Epoch 270 / 2000 - 270 epochs total
Iteration 0, loss = 0.0061
Iteration 20, loss = 0.0042
Iteration 40, loss = 0.0048
Iteration 60, loss = 0.0099
Iteration 80, loss = 0.0045
--- Epoch 271 / 2000 - 271 epochs total
Iteration 0, loss = 0.0057
Iteration 20, loss = 0.0041
Iteration 40, loss = 0.0020
Iteration 60, loss = 0.0025
Iteration 80, loss = 0.0020
--- Epoch 272 / 2000 - 272 epochs total
Iteration 0, loss = 0.0019
Iteration 20, loss = 0.0077
Iteration 40, loss = 0.0112
Iteration 60, loss = 0.0035
Iteration 80, loss = 0.0075
--- Epoch 273 / 2000 - 273 epochs total
Iteration 0, loss = 0.0205
Iteration 20, loss = 0.0053
Iteration 40, loss = 0.0046
Iteration 60, loss = 0.0081
Iteration 80, loss = 0.0035
--- Epoch 274 / 2000 - 274 epochs total
Iteration 0, loss = 0.0038
Iteration 20, loss = 0.0092
Iteration 40, loss = 0.0030
Iteration 60, loss = 0.0020
Iteration 80, loss = 0.0089
--- Epoch 275 / 2000 - 275 epochs total
Iteration 0, loss = 0.0091
Iteration 20, loss = 0.0068
Iteration 40, loss = 0.0023
Iteration 60, loss = 0.0019
Iteration 80, loss = 0.0026
--- Epoch 276 / 2000 - 276 epochs total
Iteration 0, loss = 0.0047
Iteration 20, loss = 0.0067
Iteration 40, loss = 0.0016
Iteration 60, loss = 0.0072
Iteration 80, loss = 0.0109
--- Epoch 277 / 2000 - 277 epochs total
Iteration 0, loss = 0.0029
Iteration 20, loss = 0.0040
Iteration 40, loss = 0.0118
Iteration 60, loss = 0.0065
Iteration 80, loss = 0.0065
--- Epoch 278 / 2000 - 278 epochs total
Iteration 0, loss = 0.0040
Iteration 20, loss = 0.0135
Iteration 40, loss = 0.0134
Iteration 60, loss = 0.0120
Iteration 80, loss = 0.0341
--- Epoch 279 / 2000 - 279 epochs total
Iteration 0, loss = 0.0043
Iteration 20, loss = 0.0059
Iteration 40, loss = 0.0132
Iteration 60, loss = 0.0013
Iteration 80, loss = 0.0139
--- Epoch 280 / 2000 - 280 epochs total
Iteration 0, loss = 0.0022
Iteration 20, loss = 0.0027
Iteration 40, loss = 0.0037
Iteration 60, loss = 0.0083
Iteration 80, loss = 0.0023
--- Epoch 281 / 2000 - 281 epochs total
Iteration 0, loss = 0.0035
Iteration 20, loss = 0.0097
Iteration 40, loss = 0.0074
Iteration 60, loss = 0.0152
Iteration 80, loss = 0.0043
--- Epoch 282 / 2000 - 282 epochs total
Iteration 0, loss = 0.0128
Iteration 20, loss = 0.0039
Iteration 40, loss = 0.0206
Iteration 60, loss = 0.0032
Iteration 80, loss = 0.0040
--- Epoch 283 / 2000 - 283 epochs total
Iteration 0, loss = 0.0057
Iteration 20, loss = 0.0027
Iteration 40, loss = 0.0054
Iteration 60, loss = 0.0067
Iteration 80, loss = 0.0122
--- Epoch 284 / 2000 - 284 epochs total
Iteration 0, loss = 0.0036
Iteration 20, loss = 0.0023
Iteration 40, loss = 0.0022
Iteration 60, loss = 0.0073
Iteration 80, loss = 0.0403
--- Epoch 285 / 2000 - 285 epochs total
Iteration 0, loss = 0.0198
Iteration 20, loss = 0.0038
Iteration 40, loss = 0.0043
Iteration 60, loss = 0.0041
Iteration 80, loss = 0.0106
--- Epoch 286 / 2000 - 286 epochs total
Iteration 0, loss = 0.0088
Iteration 20, loss = 0.0044
Iteration 40, loss = 0.0030
Iteration 60, loss = 0.0037
Iteration 80, loss = 0.0090
--- Epoch 287 / 2000 - 287 epochs total
Iteration 0, loss = 0.0090
Iteration 20, loss = 0.0029
Iteration 40, loss = 0.0323
Iteration 60, loss = 0.0026
Iteration 80, loss = 0.0070
--- Epoch 288 / 2000 - 288 epochs total
Iteration 0, loss = 0.0063
Iteration 20, loss = 0.0030
Iteration 40, loss = 0.0107
Iteration 60, loss = 0.0233
Iteration 80, loss = 0.0013
--- Epoch 289 / 2000 - 289 epochs total
Iteration 0, loss = 0.0063
Iteration 20, loss = 0.0012
Iteration 40, loss = 0.0099
Iteration 60, loss = 0.0055
Iteration 80, loss = 0.0014
--- Epoch 290 / 2000 - 290 epochs total
Iteration 0, loss = 0.0041
Iteration 20, loss = 0.0042
Iteration 40, loss = 0.0018
Iteration 60, loss = 0.0040
Iteration 80, loss = 0.0037
--- Epoch 291 / 2000 - 291 epochs total
Iteration 0, loss = 0.0056
Iteration 20, loss = 0.0021
Iteration 40, loss = 0.0068
Iteration 60, loss = 0.0059
Iteration 80, loss = 0.0052
--- Epoch 292 / 2000 - 292 epochs total
Iteration 0, loss = 0.0043
Iteration 20, loss = 0.0298
Iteration 40, loss = 0.0021
Iteration 60, loss = 0.0018
Iteration 80, loss = 0.0096
--- Epoch 293 / 2000 - 293 epochs total
Iteration 0, loss = 0.0034
Iteration 20, loss = 0.0154
Iteration 40, loss = 0.0046
Iteration 60, loss = 0.0023
Iteration 80, loss = 0.0050
--- Epoch 294 / 2000 - 294 epochs total
Iteration 0, loss = 0.0101
Iteration 20, loss = 0.0018
Iteration 40, loss = 0.0200
Iteration 60, loss = 0.0036
Iteration 80, loss = 0.0015
--- Epoch 295 / 2000 - 295 epochs total
Iteration 0, loss = 0.0052
Iteration 20, loss = 0.0101
Iteration 40, loss = 0.0023
Iteration 60, loss = 0.0256
Iteration 80, loss = 0.0050
--- Epoch 296 / 2000 - 296 epochs total
Iteration 0, loss = 0.0026
Iteration 20, loss = 0.0039
Iteration 40, loss = 0.0373
Iteration 60, loss = 0.0021
Iteration 80, loss = 0.0045
--- Epoch 297 / 2000 - 297 epochs total
Iteration 0, loss = 0.0038
Iteration 20, loss = 0.0174
Iteration 40, loss = 0.0043
Iteration 60, loss = 0.0065
Iteration 80, loss = 0.0089
--- Epoch 298 / 2000 - 298 epochs total
Iteration 0, loss = 0.0030
Iteration 20, loss = 0.0031
Iteration 40, loss = 0.0045
Iteration 60, loss = 0.0037
Iteration 80, loss = 0.0075
--- Epoch 299 / 2000 - 299 epochs total
Iteration 0, loss = 0.0046
Iteration 20, loss = 0.0023
Iteration 40, loss = 0.0030
Iteration 60, loss = 0.0226
Iteration 80, loss = 0.0057
--- Epoch 300 / 2000 - 300 epochs total
Iteration 0, loss = 0.0020
Iteration 20, loss = 0.0085
Iteration 40, loss = 0.0075
Iteration 60, loss = 0.0129
Iteration 80, loss = 0.0053
--- Epoch 301 / 2000 - 301 epochs total
Iteration 0, loss = 0.0199
Iteration 20, loss = 0.0034
Iteration 40, loss = 0.0118
Iteration 60, loss = 0.0020
Iteration 80, loss = 0.0043
--- Epoch 302 / 2000 - 302 epochs total
Iteration 0, loss = 0.0032
Iteration 20, loss = 0.0271
Iteration 40, loss = 0.0143
Iteration 60, loss = 0.0066
Iteration 80, loss = 0.0016
--- Epoch 303 / 2000 - 303 epochs total
Iteration 0, loss = 0.0022
Iteration 20, loss = 0.0088
Iteration 40, loss = 0.0047
Iteration 60, loss = 0.0093
Iteration 80, loss = 0.0027
--- Epoch 304 / 2000 - 304 epochs total
Iteration 0, loss = 0.0112
Iteration 20, loss = 0.0195
Iteration 40, loss = 0.0165
Iteration 60, loss = 0.0024
Iteration 80, loss = 0.0058
--- Epoch 305 / 2000 - 305 epochs total
Iteration 0, loss = 0.0058
Iteration 20, loss = 0.0071
Iteration 40, loss = 0.0123
Iteration 60, loss = 0.0079
Iteration 80, loss = 0.0086
--- Epoch 306 / 2000 - 306 epochs total
Iteration 0, loss = 0.0024
Iteration 20, loss = 0.0051
Iteration 40, loss = 0.0060
Iteration 60, loss = 0.0072
Iteration 80, loss = 0.0055
--- Epoch 307 / 2000 - 307 epochs total
Iteration 0, loss = 0.0050
Iteration 20, loss = 0.0027
Iteration 40, loss = 0.0089
Iteration 60, loss = 0.0027
Iteration 80, loss = 0.0093
--- Epoch 308 / 2000 - 308 epochs total
Iteration 0, loss = 0.0152
Iteration 20, loss = 0.0029
Iteration 40, loss = 0.0016
Iteration 60, loss = 0.0022
Iteration 80, loss = 0.0024
--- Epoch 309 / 2000 - 309 epochs total
Iteration 0, loss = 0.0048
Iteration 20, loss = 0.0232
Iteration 40, loss = 0.0173
Iteration 60, loss = 0.0110
Iteration 80, loss = 0.0057
--- Epoch 310 / 2000 - 310 epochs total
Iteration 0, loss = 0.0061
Iteration 20, loss = 0.0042
Iteration 40, loss = 0.0042
Iteration 60, loss = 0.0054
Iteration 80, loss = 0.0035
--- Epoch 311 / 2000 - 311 epochs total
Iteration 0, loss = 0.0045
Iteration 20, loss = 0.0052
Iteration 40, loss = 0.0021
Iteration 60, loss = 0.0033
Iteration 80, loss = 0.0015
--- Epoch 312 / 2000 - 312 epochs total
Iteration 0, loss = 0.0039
Iteration 20, loss = 0.0007
Iteration 40, loss = 0.0163
Iteration 60, loss = 0.0035
Iteration 80, loss = 0.0020
--- Epoch 313 / 2000 - 313 epochs total
Iteration 0, loss = 0.0088
Iteration 20, loss = 0.0075
Iteration 40, loss = 0.0031
Iteration 60, loss = 0.0043
Iteration 80, loss = 0.0050
--- Epoch 314 / 2000 - 314 epochs total
Iteration 0, loss = 0.0068
Iteration 20, loss = 0.0056
Iteration 40, loss = 0.0147
Iteration 60, loss = 0.0038
Iteration 80, loss = 0.0061
--- Epoch 315 / 2000 - 315 epochs total
Iteration 0, loss = 0.0069
Iteration 20, loss = 0.0066
Iteration 40, loss = 0.0124
Iteration 60, loss = 0.0098
Iteration 80, loss = 0.0080
--- Epoch 316 / 2000 - 316 epochs total
Iteration 0, loss = 0.0306
Iteration 20, loss = 0.0120
Iteration 40, loss = 0.0047
Iteration 60, loss = 0.0117
Iteration 80, loss = 0.0030
--- Epoch 317 / 2000 - 317 epochs total
Iteration 0, loss = 0.0046
Iteration 20, loss = 0.0028
Iteration 40, loss = 0.0083
Iteration 60, loss = 0.0306
Iteration 80, loss = 0.0042
--- Epoch 318 / 2000 - 318 epochs total
Iteration 0, loss = 0.0019
Iteration 20, loss = 0.0023
Iteration 40, loss = 0.0042
Iteration 60, loss = 0.0281
Iteration 80, loss = 0.0022
--- Epoch 319 / 2000 - 319 epochs total
Iteration 0, loss = 0.0031
Iteration 20, loss = 0.0018
Iteration 40, loss = 0.0062
Iteration 60, loss = 0.0078
Iteration 80, loss = 0.0031
--- Epoch 320 / 2000 - 320 epochs total
Iteration 0, loss = 0.0030
Iteration 20, loss = 0.0052
Iteration 40, loss = 0.0043
Iteration 60, loss = 0.0084
Iteration 80, loss = 0.0042
--- Epoch 321 / 2000 - 321 epochs total
Iteration 0, loss = 0.0034
Iteration 20, loss = 0.0028
Iteration 40, loss = 0.0032
Iteration 60, loss = 0.0046
Iteration 80, loss = 0.0075
--- Epoch 322 / 2000 - 322 epochs total
Iteration 0, loss = 0.0056
Iteration 20, loss = 0.0048
Iteration 40, loss = 0.0021
Iteration 60, loss = 0.0045
Iteration 80, loss = 0.0099
--- Epoch 323 / 2000 - 323 epochs total
Iteration 0, loss = 0.0043
Iteration 20, loss = 0.0168
Iteration 40, loss = 0.0052
Iteration 60, loss = 0.0031
Iteration 80, loss = 0.0017
--- Epoch 324 / 2000 - 324 epochs total
Iteration 0, loss = 0.0032
Iteration 20, loss = 0.0048
Iteration 40, loss = 0.0070
Iteration 60, loss = 0.0062
Iteration 80, loss = 0.0079
--- Epoch 325 / 2000 - 325 epochs total
Iteration 0, loss = 0.0094
Iteration 20, loss = 0.0091
Iteration 40, loss = 0.0014
Iteration 60, loss = 0.0015
Iteration 80, loss = 0.0013
--- Epoch 326 / 2000 - 326 epochs total
Iteration 0, loss = 0.0039
Iteration 20, loss = 0.0095
Iteration 40, loss = 0.0019
Iteration 60, loss = 0.0056
Iteration 80, loss = 0.0072
--- Epoch 327 / 2000 - 327 epochs total
Iteration 0, loss = 0.0060
Iteration 20, loss = 0.0028
Iteration 40, loss = 0.0015
Iteration 60, loss = 0.0055
Iteration 80, loss = 0.0143
--- Epoch 328 / 2000 - 328 epochs total
Iteration 0, loss = 0.0044
Iteration 20, loss = 0.0113
Iteration 40, loss = 0.0350
Iteration 60, loss = 0.0052
Iteration 80, loss = 0.0051
--- Epoch 329 / 2000 - 329 epochs total
Iteration 0, loss = 0.0030
Iteration 20, loss = 0.0046
Iteration 40, loss = 0.0028
Iteration 60, loss = 0.0120
Iteration 80, loss = 0.0078
--- Epoch 330 / 2000 - 330 epochs total
Iteration 0, loss = 0.0091
Iteration 20, loss = 0.0045
Iteration 40, loss = 0.0041
Iteration 60, loss = 0.0306
Iteration 80, loss = 0.0029
--- Epoch 331 / 2000 - 331 epochs total
Iteration 0, loss = 0.0032
Iteration 20, loss = 0.0059
Iteration 40, loss = 0.0147
Iteration 60, loss = 0.0058
Iteration 80, loss = 0.0106
--- Epoch 332 / 2000 - 332 epochs total
Iteration 0, loss = 0.0036
Iteration 20, loss = 0.0045
Iteration 40, loss = 0.0063
Iteration 60, loss = 0.0044
Iteration 80, loss = 0.0020
--- Epoch 333 / 2000 - 333 epochs total
Iteration 0, loss = 0.0047
Iteration 20, loss = 0.0060
Iteration 40, loss = 0.0046
Iteration 60, loss = 0.0016
Iteration 80, loss = 0.0182
--- Epoch 334 / 2000 - 334 epochs total
Iteration 0, loss = 0.0044
Iteration 20, loss = 0.0024
Iteration 40, loss = 0.0039
Iteration 60, loss = 0.0009
Iteration 80, loss = 0.0074
--- Epoch 335 / 2000 - 335 epochs total
Iteration 0, loss = 0.0036
Iteration 20, loss = 0.0048
Iteration 40, loss = 0.0056
Iteration 60, loss = 0.0034
Iteration 80, loss = 0.0110
--- Epoch 336 / 2000 - 336 epochs total
Iteration 0, loss = 0.0024
Iteration 20, loss = 0.0059
Iteration 40, loss = 0.0099
Iteration 60, loss = 0.0020
Iteration 80, loss = 0.0039
--- Epoch 337 / 2000 - 337 epochs total
Iteration 0, loss = 0.0072
Iteration 20, loss = 0.0034
Iteration 40, loss = 0.0210
Iteration 60, loss = 0.0037
Iteration 80, loss = 0.0137
--- Epoch 338 / 2000 - 338 epochs total
Iteration 0, loss = 0.0182
Iteration 20, loss = 0.0044
Iteration 40, loss = 0.0036
Iteration 60, loss = 0.0067
Iteration 80, loss = 0.0019
--- Epoch 339 / 2000 - 339 epochs total
Iteration 0, loss = 0.0046
Iteration 20, loss = 0.0126
Iteration 40, loss = 0.0045
Iteration 60, loss = 0.0027
Iteration 80, loss = 0.0034
--- Epoch 340 / 2000 - 340 epochs total
Iteration 0, loss = 0.0031
Iteration 20, loss = 0.0052
Iteration 40, loss = 0.0118
Iteration 60, loss = 0.0043
Iteration 80, loss = 0.0186
--- Epoch 341 / 2000 - 341 epochs total
Iteration 0, loss = 0.0033
Iteration 20, loss = 0.0099
Iteration 40, loss = 0.0079
Iteration 60, loss = 0.0012
Iteration 80, loss = 0.0023
--- Epoch 342 / 2000 - 342 epochs total
Iteration 0, loss = 0.0022
Iteration 20, loss = 0.0023
Iteration 40, loss = 0.0020
Iteration 60, loss = 0.0038
Iteration 80, loss = 0.0294
--- Epoch 343 / 2000 - 343 epochs total
Iteration 0, loss = 0.0043
Iteration 20, loss = 0.0016
Iteration 40, loss = 0.0051
Iteration 60, loss = 0.0027
Iteration 80, loss = 0.0021
--- Epoch 344 / 2000 - 344 epochs total
Iteration 0, loss = 0.0076
Iteration 20, loss = 0.0022
Iteration 40, loss = 0.0055
Iteration 60, loss = 0.0084
Iteration 80, loss = 0.0228
--- Epoch 345 / 2000 - 345 epochs total
Iteration 0, loss = 0.0064
Iteration 20, loss = 0.0035
Iteration 40, loss = 0.0015
Iteration 60, loss = 0.0048
Iteration 80, loss = 0.0081
--- Epoch 346 / 2000 - 346 epochs total
Iteration 0, loss = 0.0116
Iteration 20, loss = 0.0048
Iteration 40, loss = 0.0110
Iteration 60, loss = 0.0076
Iteration 80, loss = 0.0127
--- Epoch 347 / 2000 - 347 epochs total
Iteration 0, loss = 0.0122
Iteration 20, loss = 0.0141
Iteration 40, loss = 0.0139
Iteration 60, loss = 0.0062
Iteration 80, loss = 0.0063
--- Epoch 348 / 2000 - 348 epochs total
Iteration 0, loss = 0.0071
Iteration 20, loss = 0.0110
Iteration 40, loss = 0.0062
Iteration 60, loss = 0.0051
Iteration 80, loss = 0.0042
--- Epoch 349 / 2000 - 349 epochs total
Iteration 0, loss = 0.0044
Iteration 20, loss = 0.0051
Iteration 40, loss = 0.0033
Iteration 60, loss = 0.0034
Iteration 80, loss = 0.0176
--- Epoch 350 / 2000 - 350 epochs total
Iteration 0, loss = 0.0226
Iteration 20, loss = 0.0027
Iteration 40, loss = 0.0046
Iteration 60, loss = 0.0114
Iteration 80, loss = 0.0041
--- Epoch 351 / 2000 - 351 epochs total
Iteration 0, loss = 0.0051
Iteration 20, loss = 0.0019
Iteration 40, loss = 0.0022
Iteration 60, loss = 0.0079
Iteration 80, loss = 0.0039
--- Epoch 352 / 2000 - 352 epochs total
Iteration 0, loss = 0.0055
Iteration 20, loss = 0.0070
Iteration 40, loss = 0.0018
Iteration 60, loss = 0.0070
Iteration 80, loss = 0.0028
--- Epoch 353 / 2000 - 353 epochs total
Iteration 0, loss = 0.0020
Iteration 20, loss = 0.0066
Iteration 40, loss = 0.0131
Iteration 60, loss = 0.0063
Iteration 80, loss = 0.0051
--- Epoch 354 / 2000 - 354 epochs total
Iteration 0, loss = 0.0025
Iteration 20, loss = 0.0053
Iteration 40, loss = 0.0096
Iteration 60, loss = 0.0024
Iteration 80, loss = 0.0023
--- Epoch 355 / 2000 - 355 epochs total
Iteration 0, loss = 0.0040
Iteration 20, loss = 0.0015
Iteration 40, loss = 0.0016
Iteration 60, loss = 0.0047
Iteration 80, loss = 0.0130
--- Epoch 356 / 2000 - 356 epochs total
Iteration 0, loss = 0.0055
Iteration 20, loss = 0.0034
Iteration 40, loss = 0.0126
Iteration 60, loss = 0.0040
Iteration 80, loss = 0.0089
--- Epoch 357 / 2000 - 357 epochs total
Iteration 0, loss = 0.0042
Iteration 20, loss = 0.0022
Iteration 40, loss = 0.0034
Iteration 60, loss = 0.0049
Iteration 80, loss = 0.0059
--- Epoch 358 / 2000 - 358 epochs total
Iteration 0, loss = 0.0055
Iteration 20, loss = 0.0059
Iteration 40, loss = 0.0108
Iteration 60, loss = 0.0112
Iteration 80, loss = 0.0017
--- Epoch 359 / 2000 - 359 epochs total
Iteration 0, loss = 0.0380
Iteration 20, loss = 0.0028
Iteration 40, loss = 0.0028
Iteration 60, loss = 0.0011
Iteration 80, loss = 0.0089
--- Epoch 360 / 2000 - 360 epochs total
Iteration 0, loss = 0.0042
Iteration 20, loss = 0.0019
Iteration 40, loss = 0.0016
Iteration 60, loss = 0.0105
Iteration 80, loss = 0.0026
--- Epoch 361 / 2000 - 361 epochs total
Iteration 0, loss = 0.0065
Iteration 20, loss = 0.0192
Iteration 40, loss = 0.0033
Iteration 60, loss = 0.0130
Iteration 80, loss = 0.0054
--- Epoch 362 / 2000 - 362 epochs total
Iteration 0, loss = 0.0033
Iteration 20, loss = 0.0025
Iteration 40, loss = 0.0012
Iteration 60, loss = 0.0101
Iteration 80, loss = 0.0010
--- Epoch 363 / 2000 - 363 epochs total
Iteration 0, loss = 0.0072
Iteration 20, loss = 0.0063
Iteration 40, loss = 0.0069
Iteration 60, loss = 0.0038
Iteration 80, loss = 0.0048
--- Epoch 364 / 2000 - 364 epochs total
Iteration 0, loss = 0.0027
Iteration 20, loss = 0.0013
Iteration 40, loss = 0.0056
Iteration 60, loss = 0.0078
Iteration 80, loss = 0.0016
--- Epoch 365 / 2000 - 365 epochs total
Iteration 0, loss = 0.0045
Iteration 20, loss = 0.0091
Iteration 40, loss = 0.0103
Iteration 60, loss = 0.0251
Iteration 80, loss = 0.0017
--- Epoch 366 / 2000 - 366 epochs total
Iteration 0, loss = 0.0044
Iteration 20, loss = 0.0022
Iteration 40, loss = 0.0074
Iteration 60, loss = 0.0033
Iteration 80, loss = 0.0095
--- Epoch 367 / 2000 - 367 epochs total
Iteration 0, loss = 0.0028
Iteration 20, loss = 0.0093
Iteration 40, loss = 0.0034
Iteration 60, loss = 0.0024
Iteration 80, loss = 0.0019
--- Epoch 368 / 2000 - 368 epochs total
Iteration 0, loss = 0.0026
Iteration 20, loss = 0.0072
Iteration 40, loss = 0.0032
Iteration 60, loss = 0.0028
Iteration 80, loss = 0.0037
--- Epoch 369 / 2000 - 369 epochs total
Iteration 0, loss = 0.0088
Iteration 20, loss = 0.0117
Iteration 40, loss = 0.0243
Iteration 60, loss = 0.0023
Iteration 80, loss = 0.0033
--- Epoch 370 / 2000 - 370 epochs total
Iteration 0, loss = 0.0045
Iteration 20, loss = 0.0092
Iteration 40, loss = 0.0088
Iteration 60, loss = 0.0076
Iteration 80, loss = 0.0254
--- Epoch 371 / 2000 - 371 epochs total
Iteration 0, loss = 0.0055
Iteration 20, loss = 0.0142
Iteration 40, loss = 0.0043
Iteration 60, loss = 0.0100
Iteration 80, loss = 0.0119
--- Epoch 372 / 2000 - 372 epochs total
Iteration 0, loss = 0.0025
Iteration 20, loss = 0.0020
Iteration 40, loss = 0.0052
Iteration 60, loss = 0.0070
Iteration 80, loss = 0.0049
--- Epoch 373 / 2000 - 373 epochs total
Iteration 0, loss = 0.0015
Iteration 20, loss = 0.0063
Iteration 40, loss = 0.0014
Iteration 60, loss = 0.0198
Iteration 80, loss = 0.0058
--- Epoch 374 / 2000 - 374 epochs total
Iteration 0, loss = 0.0346
Iteration 20, loss = 0.0059
Iteration 40, loss = 0.0054
Iteration 60, loss = 0.0048
Iteration 80, loss = 0.0031
--- Epoch 375 / 2000 - 375 epochs total
Iteration 0, loss = 0.0033
Iteration 20, loss = 0.0166
Iteration 40, loss = 0.0019
Iteration 60, loss = 0.0129
Iteration 80, loss = 0.0143
--- Epoch 376 / 2000 - 376 epochs total
Iteration 0, loss = 0.0035
Iteration 20, loss = 0.0036
Iteration 40, loss = 0.0097
Iteration 60, loss = 0.0029
Iteration 80, loss = 0.0019
--- Epoch 377 / 2000 - 377 epochs total
Iteration 0, loss = 0.0009
Iteration 20, loss = 0.0037
Iteration 40, loss = 0.0055
Iteration 60, loss = 0.0048
Iteration 80, loss = 0.0193
--- Epoch 378 / 2000 - 378 epochs total
Iteration 0, loss = 0.0067
Iteration 20, loss = 0.0028
Iteration 40, loss = 0.0012
Iteration 60, loss = 0.0064
Iteration 80, loss = 0.0039
--- Epoch 379 / 2000 - 379 epochs total
Iteration 0, loss = 0.0201
Iteration 20, loss = 0.0023
Iteration 40, loss = 0.0048
Iteration 60, loss = 0.0027
Iteration 80, loss = 0.0015
--- Epoch 380 / 2000 - 380 epochs total
Iteration 0, loss = 0.0016
Iteration 20, loss = 0.0025
Iteration 40, loss = 0.0015
Iteration 60, loss = 0.0091
Iteration 80, loss = 0.0073
--- Epoch 381 / 2000 - 381 epochs total
Iteration 0, loss = 0.0035
Iteration 20, loss = 0.0057
Iteration 40, loss = 0.0032
Iteration 60, loss = 0.0057
Iteration 80, loss = 0.0085
--- Epoch 382 / 2000 - 382 epochs total
Iteration 0, loss = 0.0042
Iteration 20, loss = 0.0037
Iteration 40, loss = 0.0066
Iteration 60, loss = 0.0033
Iteration 80, loss = 0.0051
--- Epoch 383 / 2000 - 383 epochs total
Iteration 0, loss = 0.0047
Iteration 20, loss = 0.0259
Iteration 40, loss = 0.0017
Iteration 60, loss = 0.0027
Iteration 80, loss = 0.0026
--- Epoch 384 / 2000 - 384 epochs total
Iteration 0, loss = 0.0030
Iteration 20, loss = 0.0040
Iteration 40, loss = 0.0066
Iteration 60, loss = 0.0026
Iteration 80, loss = 0.0021
--- Epoch 385 / 2000 - 385 epochs total
Iteration 0, loss = 0.0071
Iteration 20, loss = 0.0116
Iteration 40, loss = 0.0019
Iteration 60, loss = 0.0069
Iteration 80, loss = 0.0084
--- Epoch 386 / 2000 - 386 epochs total
Iteration 0, loss = 0.0026
Iteration 20, loss = 0.0050
Iteration 40, loss = 0.0051
Iteration 60, loss = 0.0074
Iteration 80, loss = 0.0038
--- Epoch 387 / 2000 - 387 epochs total
Iteration 0, loss = 0.0055
Iteration 20, loss = 0.0166
Iteration 40, loss = 0.0017
Iteration 60, loss = 0.0044
Iteration 80, loss = 0.0045
--- Epoch 388 / 2000 - 388 epochs total
Iteration 0, loss = 0.0108
Iteration 20, loss = 0.0039
Iteration 40, loss = 0.0076
Iteration 60, loss = 0.0057
Iteration 80, loss = 0.0116
--- Epoch 389 / 2000 - 389 epochs total
Iteration 0, loss = 0.0044
Iteration 20, loss = 0.0043
Iteration 40, loss = 0.0068
Iteration 60, loss = 0.0043
Iteration 80, loss = 0.0046
--- Epoch 390 / 2000 - 390 epochs total
Iteration 0, loss = 0.0140
Iteration 20, loss = 0.0095
Iteration 40, loss = 0.0059
Iteration 60, loss = 0.0039
Iteration 80, loss = 0.0092
--- Epoch 391 / 2000 - 391 epochs total
Iteration 0, loss = 0.0018
Iteration 20, loss = 0.0020
Iteration 40, loss = 0.0033
Iteration 60, loss = 0.0068
Iteration 80, loss = 0.0326
--- Epoch 392 / 2000 - 392 epochs total
Iteration 0, loss = 0.0031
Iteration 20, loss = 0.0041
Iteration 40, loss = 0.0282
Iteration 60, loss = 0.0199
Iteration 80, loss = 0.0041
--- Epoch 393 / 2000 - 393 epochs total
Iteration 0, loss = 0.0105
Iteration 20, loss = 0.0063
Iteration 40, loss = 0.0065
Iteration 60, loss = 0.0042
Iteration 80, loss = 0.0178
--- Epoch 394 / 2000 - 394 epochs total
Iteration 0, loss = 0.0104
Iteration 20, loss = 0.0030
Iteration 40, loss = 0.0066
Iteration 60, loss = 0.0053
Iteration 80, loss = 0.0053
--- Epoch 395 / 2000 - 395 epochs total
Iteration 0, loss = 0.0050
Iteration 20, loss = 0.0036
Iteration 40, loss = 0.0054
Iteration 60, loss = 0.0022
Iteration 80, loss = 0.0049
--- Epoch 396 / 2000 - 396 epochs total
Iteration 0, loss = 0.0053
Iteration 20, loss = 0.0040
Iteration 40, loss = 0.0047
Iteration 60, loss = 0.0025
Iteration 80, loss = 0.0087
--- Epoch 397 / 2000 - 397 epochs total
Iteration 0, loss = 0.0037
Iteration 20, loss = 0.0043
Iteration 40, loss = 0.0048
Iteration 60, loss = 0.0015
Iteration 80, loss = 0.0091
--- Epoch 398 / 2000 - 398 epochs total
Iteration 0, loss = 0.0043
Iteration 20, loss = 0.0035
Iteration 40, loss = 0.0046
Iteration 60, loss = 0.0022
Iteration 80, loss = 0.0122
--- Epoch 399 / 2000 - 399 epochs total
Iteration 0, loss = 0.0049
Iteration 20, loss = 0.0019
Iteration 40, loss = 0.0094
Iteration 60, loss = 0.0042
Iteration 80, loss = 0.0027
--- Epoch 400 / 2000 - 400 epochs total
Iteration 0, loss = 0.0102
Iteration 20, loss = 0.0103
Iteration 40, loss = 0.0021
Iteration 60, loss = 0.0028
Iteration 80, loss = 0.0044
--- Epoch 401 / 2000 - 401 epochs total
Iteration 0, loss = 0.0062
Iteration 20, loss = 0.0056
Iteration 40, loss = 0.0287
Iteration 60, loss = 0.0025
Iteration 80, loss = 0.0064
--- Epoch 402 / 2000 - 402 epochs total
Iteration 0, loss = 0.0052
Iteration 20, loss = 0.0093
Iteration 40, loss = 0.0062
Iteration 60, loss = 0.0041
Iteration 80, loss = 0.0131
--- Epoch 403 / 2000 - 403 epochs total
Iteration 0, loss = 0.0052
Iteration 20, loss = 0.0044
Iteration 40, loss = 0.0048
Iteration 60, loss = 0.0037
Iteration 80, loss = 0.0025
--- Epoch 404 / 2000 - 404 epochs total
Iteration 0, loss = 0.0032
Iteration 20, loss = 0.0094
Iteration 40, loss = 0.0025
Iteration 60, loss = 0.0032
Iteration 80, loss = 0.0038
--- Epoch 405 / 2000 - 405 epochs total
Iteration 0, loss = 0.0038
Iteration 20, loss = 0.0025
Iteration 40, loss = 0.0021
Iteration 60, loss = 0.0056
Iteration 80, loss = 0.0039
--- Epoch 406 / 2000 - 406 epochs total
Iteration 0, loss = 0.0048
Iteration 20, loss = 0.0041
Iteration 40, loss = 0.0187
Iteration 60, loss = 0.0036
Iteration 80, loss = 0.0014
--- Epoch 407 / 2000 - 407 epochs total
Iteration 0, loss = 0.0098
Iteration 20, loss = 0.0142
Iteration 40, loss = 0.0157
Iteration 60, loss = 0.0146
Iteration 80, loss = 0.0074
--- Epoch 408 / 2000 - 408 epochs total
Iteration 0, loss = 0.0037
Iteration 20, loss = 0.0034
Iteration 40, loss = 0.0352
Iteration 60, loss = 0.0122
Iteration 80, loss = 0.0013
--- Epoch 409 / 2000 - 409 epochs total
Iteration 0, loss = 0.0034
Iteration 20, loss = 0.0057
Iteration 40, loss = 0.0025
Iteration 60, loss = 0.0023
Iteration 80, loss = 0.0034
--- Epoch 410 / 2000 - 410 epochs total
Iteration 0, loss = 0.0060
Iteration 20, loss = 0.0042
Iteration 40, loss = 0.0071
Iteration 60, loss = 0.0075
Iteration 80, loss = 0.0048
--- Epoch 411 / 2000 - 411 epochs total
Iteration 0, loss = 0.0111
Iteration 20, loss = 0.0041
Iteration 40, loss = 0.0029
Iteration 60, loss = 0.0032
Iteration 80, loss = 0.0055
--- Epoch 412 / 2000 - 412 epochs total
Iteration 0, loss = 0.0029
Iteration 20, loss = 0.0320
Iteration 40, loss = 0.0029
Iteration 60, loss = 0.0059
Iteration 80, loss = 0.0021
--- Epoch 413 / 2000 - 413 epochs total
Iteration 0, loss = 0.0155
Iteration 20, loss = 0.0071
Iteration 40, loss = 0.0063
Iteration 60, loss = 0.0016
Iteration 80, loss = 0.0046
--- Epoch 414 / 2000 - 414 epochs total
Iteration 0, loss = 0.0075
Iteration 20, loss = 0.0038
Iteration 40, loss = 0.0035
Iteration 60, loss = 0.0066
Iteration 80, loss = 0.0044
--- Epoch 415 / 2000 - 415 epochs total
Iteration 0, loss = 0.0021
Iteration 20, loss = 0.0102
Iteration 40, loss = 0.0079
Iteration 60, loss = 0.0049
Iteration 80, loss = 0.0036
--- Epoch 416 / 2000 - 416 epochs total
Iteration 0, loss = 0.0019
Iteration 20, loss = 0.0025
Iteration 40, loss = 0.0030
Iteration 60, loss = 0.0042
Iteration 80, loss = 0.0045
--- Epoch 417 / 2000 - 417 epochs total
Iteration 0, loss = 0.0047
Iteration 20, loss = 0.0059
Iteration 40, loss = 0.0053
Iteration 60, loss = 0.0083
Iteration 80, loss = 0.0026
--- Epoch 418 / 2000 - 418 epochs total
Iteration 0, loss = 0.0046
Iteration 20, loss = 0.0337
Iteration 40, loss = 0.0027
Iteration 60, loss = 0.0018
Iteration 80, loss = 0.0070
--- Epoch 419 / 2000 - 419 epochs total
Iteration 0, loss = 0.0022
Iteration 20, loss = 0.0035
Iteration 40, loss = 0.0043
Iteration 60, loss = 0.0059
Iteration 80, loss = 0.0078
--- Epoch 420 / 2000 - 420 epochs total
Iteration 0, loss = 0.0052
Iteration 20, loss = 0.0044
Iteration 40, loss = 0.0100
Iteration 60, loss = 0.0117
Iteration 80, loss = 0.0036
--- Epoch 421 / 2000 - 421 epochs total
Iteration 0, loss = 0.0125
Iteration 20, loss = 0.0022
Iteration 40, loss = 0.0022
Iteration 60, loss = 0.0100
Iteration 80, loss = 0.0039
--- Epoch 422 / 2000 - 422 epochs total
Iteration 0, loss = 0.0031
Iteration 20, loss = 0.0073
Iteration 40, loss = 0.0052
Iteration 60, loss = 0.0032
Iteration 80, loss = 0.0137
--- Epoch 423 / 2000 - 423 epochs total
Iteration 0, loss = 0.0021
Iteration 20, loss = 0.0039
Iteration 40, loss = 0.0025
Iteration 60, loss = 0.0029
Iteration 80, loss = 0.0010
--- Epoch 424 / 2000 - 424 epochs total
Iteration 0, loss = 0.0033
Iteration 20, loss = 0.0026
Iteration 40, loss = 0.0097
Iteration 60, loss = 0.0031
Iteration 80, loss = 0.0025
--- Epoch 425 / 2000 - 425 epochs total
Iteration 0, loss = 0.0048
Iteration 20, loss = 0.0188
Iteration 40, loss = 0.0060
Iteration 60, loss = 0.0075
Iteration 80, loss = 0.0040
--- Epoch 426 / 2000 - 426 epochs total
Iteration 0, loss = 0.0050
Iteration 20, loss = 0.0075
Iteration 40, loss = 0.0021
Iteration 60, loss = 0.0047
Iteration 80, loss = 0.0100
--- Epoch 427 / 2000 - 427 epochs total
Iteration 0, loss = 0.0033
Iteration 20, loss = 0.0019
Iteration 40, loss = 0.0047
Iteration 60, loss = 0.0069
Iteration 80, loss = 0.0232
--- Epoch 428 / 2000 - 428 epochs total
Iteration 0, loss = 0.0138
Iteration 20, loss = 0.0378
Iteration 40, loss = 0.0031
Iteration 60, loss = 0.0139
Iteration 80, loss = 0.0029
--- Epoch 429 / 2000 - 429 epochs total
Iteration 0, loss = 0.0046
Iteration 20, loss = 0.0050
Iteration 40, loss = 0.0033
Iteration 60, loss = 0.0079
Iteration 80, loss = 0.0023
--- Epoch 430 / 2000 - 430 epochs total
Iteration 0, loss = 0.0035
Iteration 20, loss = 0.0076
Iteration 40, loss = 0.0050
Iteration 60, loss = 0.0053
Iteration 80, loss = 0.0052
--- Epoch 431 / 2000 - 431 epochs total
Iteration 0, loss = 0.0064
Iteration 20, loss = 0.0029
Iteration 40, loss = 0.0092
Iteration 60, loss = 0.0047
Iteration 80, loss = 0.0025
--- Epoch 432 / 2000 - 432 epochs total
Iteration 0, loss = 0.0019
Iteration 20, loss = 0.0043
Iteration 40, loss = 0.0043
Iteration 60, loss = 0.0099
Iteration 80, loss = 0.0051
--- Epoch 433 / 2000 - 433 epochs total
Iteration 0, loss = 0.0038
Iteration 20, loss = 0.0061
Iteration 40, loss = 0.0034
Iteration 60, loss = 0.0025
Iteration 80, loss = 0.0052
--- Epoch 434 / 2000 - 434 epochs total
Iteration 0, loss = 0.0181
Iteration 20, loss = 0.0032
Iteration 40, loss = 0.0047
Iteration 60, loss = 0.0075
Iteration 80, loss = 0.0029
--- Epoch 435 / 2000 - 435 epochs total
Iteration 0, loss = 0.0061
Iteration 20, loss = 0.0023
Iteration 40, loss = 0.0023
Iteration 60, loss = 0.0026
Iteration 80, loss = 0.0059
--- Epoch 436 / 2000 - 436 epochs total
Iteration 0, loss = 0.0065
Iteration 20, loss = 0.0105
Iteration 40, loss = 0.0144
Iteration 60, loss = 0.0077
Iteration 80, loss = 0.0059
--- Epoch 437 / 2000 - 437 epochs total
Iteration 0, loss = 0.0132
Iteration 20, loss = 0.0065
Iteration 40, loss = 0.0027
Iteration 60, loss = 0.0165
Iteration 80, loss = 0.0089
--- Epoch 438 / 2000 - 438 epochs total
Iteration 0, loss = 0.0021
Iteration 20, loss = 0.0020
Iteration 40, loss = 0.0007
Iteration 60, loss = 0.0037
Iteration 80, loss = 0.0089
--- Epoch 439 / 2000 - 439 epochs total
Iteration 0, loss = 0.0042
Iteration 20, loss = 0.0207
Iteration 40, loss = 0.0042
Iteration 60, loss = 0.0019
Iteration 80, loss = 0.0024
--- Epoch 440 / 2000 - 440 epochs total
Iteration 0, loss = 0.0071
Iteration 20, loss = 0.0041
Iteration 40, loss = 0.0064
Iteration 60, loss = 0.0087
Iteration 80, loss = 0.0048
--- Epoch 441 / 2000 - 441 epochs total
Iteration 0, loss = 0.0021
Iteration 20, loss = 0.0109
Iteration 40, loss = 0.0019
Iteration 60, loss = 0.0099
Iteration 80, loss = 0.0121
--- Epoch 442 / 2000 - 442 epochs total
Iteration 0, loss = 0.0071
Iteration 20, loss = 0.0102
Iteration 40, loss = 0.0079
Iteration 60, loss = 0.0024
Iteration 80, loss = 0.0062
--- Epoch 443 / 2000 - 443 epochs total
Iteration 0, loss = 0.0033
Iteration 20, loss = 0.0104
Iteration 40, loss = 0.0064
Iteration 60, loss = 0.0122
Iteration 80, loss = 0.0200
--- Epoch 444 / 2000 - 444 epochs total
Iteration 0, loss = 0.0086
Iteration 20, loss = 0.0106
Iteration 40, loss = 0.0012
Iteration 60, loss = 0.0013
Iteration 80, loss = 0.0057
--- Epoch 445 / 2000 - 445 epochs total
Iteration 0, loss = 0.0012
Iteration 20, loss = 0.0035
Iteration 40, loss = 0.0036
Iteration 60, loss = 0.0019
Iteration 80, loss = 0.0018
--- Epoch 446 / 2000 - 446 epochs total
Iteration 0, loss = 0.0024
Iteration 20, loss = 0.0029
Iteration 40, loss = 0.0019
Iteration 60, loss = 0.0083
Iteration 80, loss = 0.0038
--- Epoch 447 / 2000 - 447 epochs total
Iteration 0, loss = 0.0039
Iteration 20, loss = 0.0062
Iteration 40, loss = 0.0060
Iteration 60, loss = 0.0056
Iteration 80, loss = 0.0018
--- Epoch 448 / 2000 - 448 epochs total
Iteration 0, loss = 0.0048
Iteration 20, loss = 0.0267
Iteration 40, loss = 0.0019
Iteration 60, loss = 0.0048
Iteration 80, loss = 0.0015
--- Epoch 449 / 2000 - 449 epochs total
Iteration 0, loss = 0.0196
Iteration 20, loss = 0.0040
Iteration 40, loss = 0.0045
Iteration 60, loss = 0.0047
Iteration 80, loss = 0.0028
--- Epoch 450 / 2000 - 450 epochs total
Iteration 0, loss = 0.0289
Iteration 20, loss = 0.0190
Iteration 40, loss = 0.0067
Iteration 60, loss = 0.0089
Iteration 80, loss = 0.0062
--- Epoch 451 / 2000 - 451 epochs total
Iteration 0, loss = 0.0039
Iteration 20, loss = 0.0060
Iteration 40, loss = 0.0014
Iteration 60, loss = 0.0069
Iteration 80, loss = 0.0106
--- Epoch 452 / 2000 - 452 epochs total
Iteration 0, loss = 0.0043
Iteration 20, loss = 0.0074
Iteration 40, loss = 0.0070
Iteration 60, loss = 0.0081
Iteration 80, loss = 0.0037
--- Epoch 453 / 2000 - 453 epochs total
Iteration 0, loss = 0.0025
Iteration 20, loss = 0.0042
Iteration 40, loss = 0.0069
Iteration 60, loss = 0.0040
Iteration 80, loss = 0.0048
--- Epoch 454 / 2000 - 454 epochs total
Iteration 0, loss = 0.0012
Iteration 20, loss = 0.0121
Iteration 40, loss = 0.0130
Iteration 60, loss = 0.0126
Iteration 80, loss = 0.0084
--- Epoch 455 / 2000 - 455 epochs total
Iteration 0, loss = 0.0025
Iteration 20, loss = 0.0061
Iteration 40, loss = 0.0020
Iteration 60, loss = 0.0058
Iteration 80, loss = 0.0016
--- Epoch 456 / 2000 - 456 epochs total
Iteration 0, loss = 0.0017
Iteration 20, loss = 0.0027
Iteration 40, loss = 0.0135
Iteration 60, loss = 0.0079
Iteration 80, loss = 0.0038
--- Epoch 457 / 2000 - 457 epochs total
Iteration 0, loss = 0.0070
Iteration 20, loss = 0.0046
Iteration 40, loss = 0.0027
Iteration 60, loss = 0.0048
Iteration 80, loss = 0.0020
--- Epoch 458 / 2000 - 458 epochs total
Iteration 0, loss = 0.0026
Iteration 20, loss = 0.0047
Iteration 40, loss = 0.0014
Iteration 60, loss = 0.0101
Iteration 80, loss = 0.0043
--- Epoch 459 / 2000 - 459 epochs total
Iteration 0, loss = 0.0021
Iteration 20, loss = 0.0037
Iteration 40, loss = 0.0033
Iteration 60, loss = 0.0248
Iteration 80, loss = 0.0038
--- Epoch 460 / 2000 - 460 epochs total
Iteration 0, loss = 0.0075
Iteration 20, loss = 0.0026
Iteration 40, loss = 0.0045
Iteration 60, loss = 0.0139
Iteration 80, loss = 0.0098
--- Epoch 461 / 2000 - 461 epochs total
Iteration 0, loss = 0.0159
Iteration 20, loss = 0.0037
Iteration 40, loss = 0.0014
Iteration 60, loss = 0.0049
Iteration 80, loss = 0.0136
--- Epoch 462 / 2000 - 462 epochs total
Iteration 0, loss = 0.0019
Iteration 20, loss = 0.0084
Iteration 40, loss = 0.0079
Iteration 60, loss = 0.0015
Iteration 80, loss = 0.0042
--- Epoch 463 / 2000 - 463 epochs total
Iteration 0, loss = 0.0331
Iteration 20, loss = 0.0125
Iteration 40, loss = 0.0026
Iteration 60, loss = 0.0041
Iteration 80, loss = 0.0039
--- Epoch 464 / 2000 - 464 epochs total
Iteration 0, loss = 0.0014
Iteration 20, loss = 0.0022
Iteration 40, loss = 0.0118
Iteration 60, loss = 0.0029
Iteration 80, loss = 0.0032
--- Epoch 465 / 2000 - 465 epochs total
Iteration 0, loss = 0.0067
Iteration 20, loss = 0.0022
Iteration 40, loss = 0.0062
Iteration 60, loss = 0.0022
Iteration 80, loss = 0.0107
--- Epoch 466 / 2000 - 466 epochs total
Iteration 0, loss = 0.0080
Iteration 20, loss = 0.0019
Iteration 40, loss = 0.0036
Iteration 60, loss = 0.0055
Iteration 80, loss = 0.0075
--- Epoch 467 / 2000 - 467 epochs total
Iteration 0, loss = 0.0231
Iteration 20, loss = 0.0073
Iteration 40, loss = 0.0047
Iteration 60, loss = 0.0025
Iteration 80, loss = 0.0101
--- Epoch 468 / 2000 - 468 epochs total
Iteration 0, loss = 0.0034
Iteration 20, loss = 0.0037
Iteration 40, loss = 0.0063
Iteration 60, loss = 0.0059
Iteration 80, loss = 0.0075
--- Epoch 469 / 2000 - 469 epochs total
Iteration 0, loss = 0.0015
Iteration 20, loss = 0.0015
Iteration 40, loss = 0.0047
Iteration 60, loss = 0.0041
Iteration 80, loss = 0.0037
--- Epoch 470 / 2000 - 470 epochs total
Iteration 0, loss = 0.0062
Iteration 20, loss = 0.0022
Iteration 40, loss = 0.0440
Iteration 60, loss = 0.0045
Iteration 80, loss = 0.0019
--- Epoch 471 / 2000 - 471 epochs total
Iteration 0, loss = 0.0050
Iteration 20, loss = 0.0089
Iteration 40, loss = 0.0029
Iteration 60, loss = 0.0035
Iteration 80, loss = 0.0019
--- Epoch 472 / 2000 - 472 epochs total
Iteration 0, loss = 0.0045
Iteration 20, loss = 0.0033
Iteration 40, loss = 0.0030
Iteration 60, loss = 0.0022
Iteration 80, loss = 0.0121
--- Epoch 473 / 2000 - 473 epochs total
Iteration 0, loss = 0.0266
Iteration 20, loss = 0.0041
Iteration 40, loss = 0.0085
Iteration 60, loss = 0.0121
Iteration 80, loss = 0.0022
--- Epoch 474 / 2000 - 474 epochs total
Iteration 0, loss = 0.0044
Iteration 20, loss = 0.0016
Iteration 40, loss = 0.0070
Iteration 60, loss = 0.0020
Iteration 80, loss = 0.0043
--- Epoch 475 / 2000 - 475 epochs total
Iteration 0, loss = 0.0018
Iteration 20, loss = 0.0064
Iteration 40, loss = 0.0039
Iteration 60, loss = 0.0032
Iteration 80, loss = 0.0037
--- Epoch 476 / 2000 - 476 epochs total
Iteration 0, loss = 0.0068
Iteration 20, loss = 0.0020
Iteration 40, loss = 0.0024
Iteration 60, loss = 0.0021
Iteration 80, loss = 0.0021
--- Epoch 477 / 2000 - 477 epochs total
Iteration 0, loss = 0.0023
Iteration 20, loss = 0.0110
Iteration 40, loss = 0.0029
Iteration 60, loss = 0.0020
Iteration 80, loss = 0.0040
--- Epoch 478 / 2000 - 478 epochs total
Iteration 0, loss = 0.0072
Iteration 20, loss = 0.0124
Iteration 40, loss = 0.0053
Iteration 60, loss = 0.0171
Iteration 80, loss = 0.0084
--- Epoch 479 / 2000 - 479 epochs total
Iteration 0, loss = 0.0032
Iteration 20, loss = 0.0095
Iteration 40, loss = 0.0066
Iteration 60, loss = 0.0072
Iteration 80, loss = 0.0085
--- Epoch 480 / 2000 - 480 epochs total
Iteration 0, loss = 0.0025
Iteration 20, loss = 0.0067
Iteration 40, loss = 0.0031
Iteration 60, loss = 0.0052
Iteration 80, loss = 0.0154
--- Epoch 481 / 2000 - 481 epochs total
Iteration 0, loss = 0.0119
Iteration 20, loss = 0.0044
Iteration 40, loss = 0.0023
Iteration 60, loss = 0.0086
Iteration 80, loss = 0.0022
--- Epoch 482 / 2000 - 482 epochs total
Iteration 0, loss = 0.0183
Iteration 20, loss = 0.0011
Iteration 40, loss = 0.0024
Iteration 60, loss = 0.0031
Iteration 80, loss = 0.0097
--- Epoch 483 / 2000 - 483 epochs total
Iteration 0, loss = 0.0069
Iteration 20, loss = 0.0021
Iteration 40, loss = 0.0044
Iteration 60, loss = 0.0049
Iteration 80, loss = 0.0019
--- Epoch 484 / 2000 - 484 epochs total
Iteration 0, loss = 0.0017
Iteration 20, loss = 0.0263
Iteration 40, loss = 0.0020
Iteration 60, loss = 0.0083
Iteration 80, loss = 0.0105
--- Epoch 485 / 2000 - 485 epochs total
Iteration 0, loss = 0.0095
Iteration 20, loss = 0.0058
Iteration 40, loss = 0.0154
Iteration 60, loss = 0.0075
Iteration 80, loss = 0.0077
--- Epoch 486 / 2000 - 486 epochs total
Iteration 0, loss = 0.0069
Iteration 20, loss = 0.0064
Iteration 40, loss = 0.0026
Iteration 60, loss = 0.0017
Iteration 80, loss = 0.0062
--- Epoch 487 / 2000 - 487 epochs total
Iteration 0, loss = 0.0347
Iteration 20, loss = 0.0029
Iteration 40, loss = 0.0071
Iteration 60, loss = 0.0025
Iteration 80, loss = 0.0028
--- Epoch 488 / 2000 - 488 epochs total
Iteration 0, loss = 0.0071
Iteration 20, loss = 0.0049
Iteration 40, loss = 0.0028
Iteration 60, loss = 0.0021
Iteration 80, loss = 0.0085
--- Epoch 489 / 2000 - 489 epochs total
Iteration 0, loss = 0.0033
Iteration 20, loss = 0.0017
Iteration 40, loss = 0.0024
Iteration 60, loss = 0.0061
Iteration 80, loss = 0.0028
--- Epoch 490 / 2000 - 490 epochs total
Iteration 0, loss = 0.0021
Iteration 20, loss = 0.0019
Iteration 40, loss = 0.0216
Iteration 60, loss = 0.0236
Iteration 80, loss = 0.0053
--- Epoch 491 / 2000 - 491 epochs total
Iteration 0, loss = 0.0025
Iteration 20, loss = 0.0180
Iteration 40, loss = 0.0018
Iteration 60, loss = 0.0020
Iteration 80, loss = 0.0122
--- Epoch 492 / 2000 - 492 epochs total
Iteration 0, loss = 0.0050
Iteration 20, loss = 0.0042
Iteration 40, loss = 0.0035
Iteration 60, loss = 0.0040
Iteration 80, loss = 0.0013
--- Epoch 493 / 2000 - 493 epochs total
Iteration 0, loss = 0.0071
Iteration 20, loss = 0.0041
Iteration 40, loss = 0.0015
Iteration 60, loss = 0.0038
Iteration 80, loss = 0.0034
--- Epoch 494 / 2000 - 494 epochs total
Iteration 0, loss = 0.0072
Iteration 20, loss = 0.0036
Iteration 40, loss = 0.0032
Iteration 60, loss = 0.0076
Iteration 80, loss = 0.0011
--- Epoch 495 / 2000 - 495 epochs total
Iteration 0, loss = 0.0125
Iteration 20, loss = 0.0188
Iteration 40, loss = 0.0038
Iteration 60, loss = 0.0047
Iteration 80, loss = 0.0012
--- Epoch 496 / 2000 - 496 epochs total
Iteration 0, loss = 0.0023
Iteration 20, loss = 0.0077
Iteration 40, loss = 0.0087
Iteration 60, loss = 0.0062
Iteration 80, loss = 0.0062
--- Epoch 497 / 2000 - 497 epochs total
Iteration 0, loss = 0.0115
Iteration 20, loss = 0.0177
Iteration 40, loss = 0.0039
Iteration 60, loss = 0.0019
Iteration 80, loss = 0.0057
--- Epoch 498 / 2000 - 498 epochs total
Iteration 0, loss = 0.0074
Iteration 20, loss = 0.0027
Iteration 40, loss = 0.0183
Iteration 60, loss = 0.0036
Iteration 80, loss = 0.0045
--- Epoch 499 / 2000 - 499 epochs total
Iteration 0, loss = 0.0010
Iteration 20, loss = 0.0144
Iteration 40, loss = 0.0030
Iteration 60, loss = 0.0029
Iteration 80, loss = 0.0021
--- Epoch 500 / 2000 - 500 epochs total
Iteration 0, loss = 0.0049
Iteration 20, loss = 0.0023
Iteration 40, loss = 0.0029
Iteration 60, loss = 0.0073
Iteration 80, loss = 0.0033
--- Epoch 501 / 2000 - 501 epochs total
Iteration 0, loss = 0.0027
Iteration 20, loss = 0.0081
Iteration 40, loss = 0.0054
Iteration 60, loss = 0.0107
Iteration 80, loss = 0.0017
--- Epoch 502 / 2000 - 502 epochs total
Iteration 0, loss = 0.0016
Iteration 20, loss = 0.0032
Iteration 40, loss = 0.0151
Iteration 60, loss = 0.0070
Iteration 80, loss = 0.0016
--- Epoch 503 / 2000 - 503 epochs total
Iteration 0, loss = 0.0063
Iteration 20, loss = 0.0104
Iteration 40, loss = 0.0024
Iteration 60, loss = 0.0103
Iteration 80, loss = 0.0025
--- Epoch 504 / 2000 - 504 epochs total
Iteration 0, loss = 0.0048
Iteration 20, loss = 0.0129
Iteration 40, loss = 0.0030
Iteration 60, loss = 0.0029
Iteration 80, loss = 0.0074
--- Epoch 505 / 2000 - 505 epochs total
Iteration 0, loss = 0.0066
Iteration 20, loss = 0.0249
Iteration 40, loss = 0.0064
Iteration 60, loss = 0.0025
Iteration 80, loss = 0.0054
--- Epoch 506 / 2000 - 506 epochs total
Iteration 0, loss = 0.0075
Iteration 20, loss = 0.0047
Iteration 40, loss = 0.0029
Iteration 60, loss = 0.0044
Iteration 80, loss = 0.0068
--- Epoch 507 / 2000 - 507 epochs total
Iteration 0, loss = 0.0024
Iteration 20, loss = 0.0063
Iteration 40, loss = 0.0063
Iteration 60, loss = 0.0022
Iteration 80, loss = 0.0102
--- Epoch 508 / 2000 - 508 epochs total
Iteration 0, loss = 0.0036
Iteration 20, loss = 0.0040
Iteration 40, loss = 0.0309
Iteration 60, loss = 0.0015
Iteration 80, loss = 0.0050
--- Epoch 509 / 2000 - 509 epochs total
Iteration 0, loss = 0.0045
Iteration 20, loss = 0.0102
Iteration 40, loss = 0.0032
Iteration 60, loss = 0.0040
Iteration 80, loss = 0.0013
--- Epoch 510 / 2000 - 510 epochs total
Iteration 0, loss = 0.0097
Iteration 20, loss = 0.0018
Iteration 40, loss = 0.0018
Iteration 60, loss = 0.0038
Iteration 80, loss = 0.0047
--- Epoch 511 / 2000 - 511 epochs total
Iteration 0, loss = 0.0130
Iteration 20, loss = 0.0079
Iteration 40, loss = 0.0033
Iteration 60, loss = 0.0241
Iteration 80, loss = 0.0061
--- Epoch 512 / 2000 - 512 epochs total
Iteration 0, loss = 0.0019
Iteration 20, loss = 0.0015
Iteration 40, loss = 0.0036
Iteration 60, loss = 0.0019
Iteration 80, loss = 0.0080
--- Epoch 513 / 2000 - 513 epochs total
Iteration 0, loss = 0.0016
Iteration 20, loss = 0.0071
Iteration 40, loss = 0.0099
Iteration 60, loss = 0.0100
Iteration 80, loss = 0.0017
--- Epoch 514 / 2000 - 514 epochs total
Iteration 0, loss = 0.0054
Iteration 20, loss = 0.0021
Iteration 40, loss = 0.0105
Iteration 60, loss = 0.0084
Iteration 80, loss = 0.0068
--- Epoch 515 / 2000 - 515 epochs total
Iteration 0, loss = 0.0087
Iteration 20, loss = 0.0088
Iteration 40, loss = 0.0081
Iteration 60, loss = 0.0044
Iteration 80, loss = 0.0027
--- Epoch 516 / 2000 - 516 epochs total
Iteration 0, loss = 0.0022
Iteration 20, loss = 0.0028
Iteration 40, loss = 0.0064
Iteration 60, loss = 0.0059
Iteration 80, loss = 0.0051
--- Epoch 517 / 2000 - 517 epochs total
Iteration 0, loss = 0.0017
Iteration 20, loss = 0.0025
Iteration 40, loss = 0.0011
Iteration 60, loss = 0.0046
Iteration 80, loss = 0.0150
--- Epoch 518 / 2000 - 518 epochs total
Iteration 0, loss = 0.0071
Iteration 20, loss = 0.0040
Iteration 40, loss = 0.0023
Iteration 60, loss = 0.0077
Iteration 80, loss = 0.0060
--- Epoch 519 / 2000 - 519 epochs total
Iteration 0, loss = 0.0025
Iteration 20, loss = 0.0041
Iteration 40, loss = 0.0032
Iteration 60, loss = 0.0028
Iteration 80, loss = 0.0187
--- Epoch 520 / 2000 - 520 epochs total
Iteration 0, loss = 0.0030
Iteration 20, loss = 0.0024
Iteration 40, loss = 0.0207
Iteration 60, loss = 0.0024
Iteration 80, loss = 0.0122
--- Epoch 521 / 2000 - 521 epochs total
Iteration 0, loss = 0.0020
Iteration 20, loss = 0.0043
Iteration 40, loss = 0.0032
Iteration 60, loss = 0.0038
Iteration 80, loss = 0.0233
--- Epoch 522 / 2000 - 522 epochs total
Iteration 0, loss = 0.0053
Iteration 20, loss = 0.0050
Iteration 40, loss = 0.0085
Iteration 60, loss = 0.0024
Iteration 80, loss = 0.0033
--- Epoch 523 / 2000 - 523 epochs total
Iteration 0, loss = 0.0058
Iteration 20, loss = 0.0078
Iteration 40, loss = 0.0013
Iteration 60, loss = 0.0026
Iteration 80, loss = 0.0034
--- Epoch 524 / 2000 - 524 epochs total
Iteration 0, loss = 0.0047
Iteration 20, loss = 0.0022
Iteration 40, loss = 0.0023
Iteration 60, loss = 0.0043
Iteration 80, loss = 0.0054
--- Epoch 525 / 2000 - 525 epochs total
Iteration 0, loss = 0.0035
Iteration 20, loss = 0.0025
Iteration 40, loss = 0.0021
Iteration 60, loss = 0.0028
Iteration 80, loss = 0.0040
--- Epoch 526 / 2000 - 526 epochs total
Iteration 0, loss = 0.0037
Iteration 20, loss = 0.0053
Iteration 40, loss = 0.0040
Iteration 60, loss = 0.0025
Iteration 80, loss = 0.0034
--- Epoch 527 / 2000 - 527 epochs total
Iteration 0, loss = 0.0022
Iteration 20, loss = 0.0017
Iteration 40, loss = 0.0025
Iteration 60, loss = 0.0048
Iteration 80, loss = 0.0071
--- Epoch 528 / 2000 - 528 epochs total
Iteration 0, loss = 0.0027
Iteration 20, loss = 0.0052
Iteration 40, loss = 0.0071
Iteration 60, loss = 0.0169
Iteration 80, loss = 0.0145
--- Epoch 529 / 2000 - 529 epochs total
Iteration 0, loss = 0.0040
Iteration 20, loss = 0.0021
Iteration 40, loss = 0.0108
Iteration 60, loss = 0.0198
Iteration 80, loss = 0.0070
--- Epoch 530 / 2000 - 530 epochs total
Iteration 0, loss = 0.0029
Iteration 20, loss = 0.0029
Iteration 40, loss = 0.0022
Iteration 60, loss = 0.0019
Iteration 80, loss = 0.0016
--- Epoch 531 / 2000 - 531 epochs total
Iteration 0, loss = 0.0034
Iteration 20, loss = 0.0079
Iteration 40, loss = 0.0043
Iteration 60, loss = 0.0040
Iteration 80, loss = 0.0023
--- Epoch 532 / 2000 - 532 epochs total
Iteration 0, loss = 0.0165
Iteration 20, loss = 0.0134
Iteration 40, loss = 0.0057
Iteration 60, loss = 0.0041
Iteration 80, loss = 0.0050
--- Epoch 533 / 2000 - 533 epochs total
Iteration 0, loss = 0.0017
Iteration 20, loss = 0.0044
Iteration 40, loss = 0.0155
Iteration 60, loss = 0.0024
Iteration 80, loss = 0.0069
--- Epoch 534 / 2000 - 534 epochs total
Iteration 0, loss = 0.0026
Iteration 20, loss = 0.0028
Iteration 40, loss = 0.0049
Iteration 60, loss = 0.0024
Iteration 80, loss = 0.0057
--- Epoch 535 / 2000 - 535 epochs total
Iteration 0, loss = 0.0029
Iteration 20, loss = 0.0049
Iteration 40, loss = 0.0300
Iteration 60, loss = 0.0016
Iteration 80, loss = 0.0167
--- Epoch 536 / 2000 - 536 epochs total
Iteration 0, loss = 0.0015
Iteration 20, loss = 0.0077
Iteration 40, loss = 0.0044
Iteration 60, loss = 0.0021
Iteration 80, loss = 0.0025
--- Epoch 537 / 2000 - 537 epochs total
Iteration 0, loss = 0.0087
Iteration 20, loss = 0.0035
Iteration 40, loss = 0.0040
Iteration 60, loss = 0.0033
Iteration 80, loss = 0.0192
--- Epoch 538 / 2000 - 538 epochs total
Iteration 0, loss = 0.0054
Iteration 20, loss = 0.0041
Iteration 40, loss = 0.0088
Iteration 60, loss = 0.0035
Iteration 80, loss = 0.0026
--- Epoch 539 / 2000 - 539 epochs total
Iteration 0, loss = 0.0124
Iteration 20, loss = 0.0189
Iteration 40, loss = 0.0110
Iteration 60, loss = 0.0027
Iteration 80, loss = 0.0027
--- Epoch 540 / 2000 - 540 epochs total
Iteration 0, loss = 0.0027
Iteration 20, loss = 0.0050
Iteration 40, loss = 0.0094
Iteration 60, loss = 0.0016
Iteration 80, loss = 0.0013
--- Epoch 541 / 2000 - 541 epochs total
Iteration 0, loss = 0.0060
Iteration 20, loss = 0.0077
Iteration 40, loss = 0.0064
Iteration 60, loss = 0.0101
Iteration 80, loss = 0.0094
--- Epoch 542 / 2000 - 542 epochs total
Iteration 0, loss = 0.0040
Iteration 20, loss = 0.0072
Iteration 40, loss = 0.0051
Iteration 60, loss = 0.0125
Iteration 80, loss = 0.0085
--- Epoch 543 / 2000 - 543 epochs total
Iteration 0, loss = 0.0080
Iteration 20, loss = 0.0030
Iteration 40, loss = 0.0021
Iteration 60, loss = 0.0103
Iteration 80, loss = 0.0082
--- Epoch 544 / 2000 - 544 epochs total
Iteration 0, loss = 0.0069
Iteration 20, loss = 0.0029
Iteration 40, loss = 0.0056
Iteration 60, loss = 0.0050
Iteration 80, loss = 0.0099
--- Epoch 545 / 2000 - 545 epochs total
Iteration 0, loss = 0.0072
Iteration 20, loss = 0.0018
Iteration 40, loss = 0.0047
Iteration 60, loss = 0.0054
Iteration 80, loss = 0.0046
--- Epoch 546 / 2000 - 546 epochs total
Iteration 0, loss = 0.0043
Iteration 20, loss = 0.0031
Iteration 40, loss = 0.0020
Iteration 60, loss = 0.0101
Iteration 80, loss = 0.0049
--- Epoch 547 / 2000 - 547 epochs total
Iteration 0, loss = 0.0146
Iteration 20, loss = 0.0131
Iteration 40, loss = 0.0029
Iteration 60, loss = 0.0040
Iteration 80, loss = 0.0034
--- Epoch 548 / 2000 - 548 epochs total
Iteration 0, loss = 0.0050
Iteration 20, loss = 0.0245
Iteration 40, loss = 0.0042
Iteration 60, loss = 0.0056
Iteration 80, loss = 0.0091
--- Epoch 549 / 2000 - 549 epochs total
Iteration 0, loss = 0.0047
Iteration 20, loss = 0.0098
Iteration 40, loss = 0.0123
Iteration 60, loss = 0.0056
Iteration 80, loss = 0.0013
--- Epoch 550 / 2000 - 550 epochs total
Iteration 0, loss = 0.0025
Iteration 20, loss = 0.0014
Iteration 40, loss = 0.0046
Iteration 60, loss = 0.0043
Iteration 80, loss = 0.0020
--- Epoch 551 / 2000 - 551 epochs total
Iteration 0, loss = 0.0123
Iteration 20, loss = 0.0092
Iteration 40, loss = 0.0100
Iteration 60, loss = 0.0079
Iteration 80, loss = 0.0023
--- Epoch 552 / 2000 - 552 epochs total
Iteration 0, loss = 0.0059
Iteration 20, loss = 0.0037
Iteration 40, loss = 0.0020
Iteration 60, loss = 0.0106
Iteration 80, loss = 0.0068
--- Epoch 553 / 2000 - 553 epochs total
Iteration 0, loss = 0.0073
Iteration 20, loss = 0.0047
Iteration 40, loss = 0.0089
Iteration 60, loss = 0.0033
Iteration 80, loss = 0.0080
--- Epoch 554 / 2000 - 554 epochs total
Iteration 0, loss = 0.0134
Iteration 20, loss = 0.0040
Iteration 40, loss = 0.0072
Iteration 60, loss = 0.0047
Iteration 80, loss = 0.0050
--- Epoch 555 / 2000 - 555 epochs total
Iteration 0, loss = 0.0123
Iteration 20, loss = 0.0078
Iteration 40, loss = 0.0019
Iteration 60, loss = 0.0091
Iteration 80, loss = 0.0106
--- Epoch 556 / 2000 - 556 epochs total
Iteration 0, loss = 0.0063
Iteration 20, loss = 0.0080
Iteration 40, loss = 0.0037
Iteration 60, loss = 0.0016
Iteration 80, loss = 0.0023
--- Epoch 557 / 2000 - 557 epochs total
Iteration 0, loss = 0.0231
Iteration 20, loss = 0.0014
Iteration 40, loss = 0.0040
Iteration 60, loss = 0.0040
Iteration 80, loss = 0.0068
--- Epoch 558 / 2000 - 558 epochs total
Iteration 0, loss = 0.0040
Iteration 20, loss = 0.0039
Iteration 40, loss = 0.0115
Iteration 60, loss = 0.0070
Iteration 80, loss = 0.0064
--- Epoch 559 / 2000 - 559 epochs total
Iteration 0, loss = 0.0181
Iteration 20, loss = 0.0057
Iteration 40, loss = 0.0104
Iteration 60, loss = 0.0070
Iteration 80, loss = 0.0020
--- Epoch 560 / 2000 - 560 epochs total
Iteration 0, loss = 0.0081
Iteration 20, loss = 0.0050
Iteration 40, loss = 0.0052
Iteration 60, loss = 0.0044
Iteration 80, loss = 0.0114
--- Epoch 561 / 2000 - 561 epochs total
Iteration 0, loss = 0.0034
Iteration 20, loss = 0.0038
Iteration 40, loss = 0.0035
Iteration 60, loss = 0.0022
Iteration 80, loss = 0.0048
--- Epoch 562 / 2000 - 562 epochs total
Iteration 0, loss = 0.0041
Iteration 20, loss = 0.0083
Iteration 40, loss = 0.0035
Iteration 60, loss = 0.0097
Iteration 80, loss = 0.0022
--- Epoch 563 / 2000 - 563 epochs total
Iteration 0, loss = 0.0076
Iteration 20, loss = 0.0065
Iteration 40, loss = 0.0056
Iteration 60, loss = 0.0015
Iteration 80, loss = 0.0076
--- Epoch 564 / 2000 - 564 epochs total
Iteration 0, loss = 0.0069
Iteration 20, loss = 0.0079
Iteration 40, loss = 0.0045
Iteration 60, loss = 0.0031
Iteration 80, loss = 0.0054
--- Epoch 565 / 2000 - 565 epochs total
Iteration 0, loss = 0.0030
Iteration 20, loss = 0.0018
Iteration 40, loss = 0.0045
Iteration 60, loss = 0.0119
Iteration 80, loss = 0.0050
--- Epoch 566 / 2000 - 566 epochs total
Iteration 0, loss = 0.0019
Iteration 20, loss = 0.0097
Iteration 40, loss = 0.0099
Iteration 60, loss = 0.0089
Iteration 80, loss = 0.0035
--- Epoch 567 / 2000 - 567 epochs total
Iteration 0, loss = 0.0095
Iteration 20, loss = 0.0107
Iteration 40, loss = 0.0132
Iteration 60, loss = 0.0053
Iteration 80, loss = 0.0093
--- Epoch 568 / 2000 - 568 epochs total
Iteration 0, loss = 0.0029
Iteration 20, loss = 0.0042
Iteration 40, loss = 0.0083
Iteration 60, loss = 0.0105
Iteration 80, loss = 0.0231
--- Epoch 569 / 2000 - 569 epochs total
Iteration 0, loss = 0.0015
Iteration 20, loss = 0.0080
Iteration 40, loss = 0.0017
Iteration 60, loss = 0.0052
Iteration 80, loss = 0.0144
--- Epoch 570 / 2000 - 570 epochs total
Iteration 0, loss = 0.0040
Iteration 20, loss = 0.0083
Iteration 40, loss = 0.0123
Iteration 60, loss = 0.0091
Iteration 80, loss = 0.0034
--- Epoch 571 / 2000 - 571 epochs total
Iteration 0, loss = 0.0031
Iteration 20, loss = 0.0073
Iteration 40, loss = 0.0068
Iteration 60, loss = 0.0090
Iteration 80, loss = 0.0031
--- Epoch 572 / 2000 - 572 epochs total
Iteration 0, loss = 0.0079
Iteration 20, loss = 0.0029
Iteration 40, loss = 0.0142
Iteration 60, loss = 0.0049
Iteration 80, loss = 0.0074
--- Epoch 573 / 2000 - 573 epochs total
Iteration 0, loss = 0.0029
Iteration 20, loss = 0.0016
Iteration 40, loss = 0.0038
Iteration 60, loss = 0.0045
Iteration 80, loss = 0.0119
--- Epoch 574 / 2000 - 574 epochs total
Iteration 0, loss = 0.0092
Iteration 20, loss = 0.0092
Iteration 40, loss = 0.0044
Iteration 60, loss = 0.0015
Iteration 80, loss = 0.0035
--- Epoch 575 / 2000 - 575 epochs total
Iteration 0, loss = 0.0035
Iteration 20, loss = 0.0039
Iteration 40, loss = 0.0093
Iteration 60, loss = 0.0055
Iteration 80, loss = 0.0137
--- Epoch 576 / 2000 - 576 epochs total
Iteration 0, loss = 0.0030
Iteration 20, loss = 0.0082
Iteration 40, loss = 0.0122
Iteration 60, loss = 0.0029
Iteration 80, loss = 0.0063
--- Epoch 577 / 2000 - 577 epochs total
Iteration 0, loss = 0.0085
Iteration 20, loss = 0.0056
Iteration 40, loss = 0.0022
Iteration 60, loss = 0.0095
Iteration 80, loss = 0.0015
--- Epoch 578 / 2000 - 578 epochs total
Iteration 0, loss = 0.0057
Iteration 20, loss = 0.0029
Iteration 40, loss = 0.0015
Iteration 60, loss = 0.0077
Iteration 80, loss = 0.0037
--- Epoch 579 / 2000 - 579 epochs total
Iteration 0, loss = 0.0087
Iteration 20, loss = 0.0015
Iteration 40, loss = 0.0061
Iteration 60, loss = 0.0047
Iteration 80, loss = 0.0045
--- Epoch 580 / 2000 - 580 epochs total
Iteration 0, loss = 0.0019
Iteration 20, loss = 0.0020
Iteration 40, loss = 0.0016
Iteration 60, loss = 0.0143
Iteration 80, loss = 0.0016
--- Epoch 581 / 2000 - 581 epochs total
Iteration 0, loss = 0.0125
Iteration 20, loss = 0.0059
Iteration 40, loss = 0.0087
Iteration 60, loss = 0.0055
Iteration 80, loss = 0.0016
--- Epoch 582 / 2000 - 582 epochs total
Iteration 0, loss = 0.0020
Iteration 20, loss = 0.0109
Iteration 40, loss = 0.0059
Iteration 60, loss = 0.0031
Iteration 80, loss = 0.0071
--- Epoch 583 / 2000 - 583 epochs total
Iteration 0, loss = 0.0113
Iteration 20, loss = 0.0065
Iteration 40, loss = 0.0079
Iteration 60, loss = 0.0090
Iteration 80, loss = 0.0105
--- Epoch 584 / 2000 - 584 epochs total
Iteration 0, loss = 0.0074
Iteration 20, loss = 0.0022
Iteration 40, loss = 0.0044
Iteration 60, loss = 0.0021
Iteration 80, loss = 0.0030
--- Epoch 585 / 2000 - 585 epochs total
Iteration 0, loss = 0.0034
Iteration 20, loss = 0.0030
Iteration 40, loss = 0.0080
Iteration 60, loss = 0.0043
Iteration 80, loss = 0.0022
--- Epoch 586 / 2000 - 586 epochs total
Iteration 0, loss = 0.0015
Iteration 20, loss = 0.0027
Iteration 40, loss = 0.0040
Iteration 60, loss = 0.0041
Iteration 80, loss = 0.0022
--- Epoch 587 / 2000 - 587 epochs total
Iteration 0, loss = 0.0027
Iteration 20, loss = 0.0040
Iteration 40, loss = 0.0018
Iteration 60, loss = 0.0021
Iteration 80, loss = 0.0041
--- Epoch 588 / 2000 - 588 epochs total
Iteration 0, loss = 0.0015
Iteration 20, loss = 0.0038
Iteration 40, loss = 0.0133
Iteration 60, loss = 0.0100
Iteration 80, loss = 0.0043
--- Epoch 589 / 2000 - 589 epochs total
Iteration 0, loss = 0.0054
Iteration 20, loss = 0.0032
Iteration 40, loss = 0.0035
Iteration 60, loss = 0.0039
Iteration 80, loss = 0.0053
--- Epoch 590 / 2000 - 590 epochs total
Iteration 0, loss = 0.0052
Iteration 20, loss = 0.0012
Iteration 40, loss = 0.0098
Iteration 60, loss = 0.0026
Iteration 80, loss = 0.0035
--- Epoch 591 / 2000 - 591 epochs total
Iteration 0, loss = 0.0062
Iteration 20, loss = 0.0041
Iteration 40, loss = 0.0026
Iteration 60, loss = 0.0025
Iteration 80, loss = 0.0019
--- Epoch 592 / 2000 - 592 epochs total
Iteration 0, loss = 0.0015
Iteration 20, loss = 0.0035
Iteration 40, loss = 0.0048
Iteration 60, loss = 0.0116
Iteration 80, loss = 0.0054
--- Epoch 593 / 2000 - 593 epochs total
Iteration 0, loss = 0.0022
Iteration 20, loss = 0.0054
Iteration 40, loss = 0.0051
Iteration 60, loss = 0.0028
Iteration 80, loss = 0.0090
--- Epoch 594 / 2000 - 594 epochs total
Iteration 0, loss = 0.0493
Iteration 20, loss = 0.0068
Iteration 40, loss = 0.0016
Iteration 60, loss = 0.0075
Iteration 80, loss = 0.0032
--- Epoch 595 / 2000 - 595 epochs total
Iteration 0, loss = 0.0047
Iteration 20, loss = 0.0165
Iteration 40, loss = 0.0121
Iteration 60, loss = 0.0036
Iteration 80, loss = 0.0083
--- Epoch 596 / 2000 - 596 epochs total
Iteration 0, loss = 0.0100
Iteration 20, loss = 0.0081
Iteration 40, loss = 0.0023
Iteration 60, loss = 0.0040
Iteration 80, loss = 0.0023
--- Epoch 597 / 2000 - 597 epochs total
Iteration 0, loss = 0.0204
Iteration 20, loss = 0.0052
Iteration 40, loss = 0.0157
Iteration 60, loss = 0.0029
Iteration 80, loss = 0.0025
--- Epoch 598 / 2000 - 598 epochs total
Iteration 0, loss = 0.0024
Iteration 20, loss = 0.0037
Iteration 40, loss = 0.0020
Iteration 60, loss = 0.0018
Iteration 80, loss = 0.0037
--- Epoch 599 / 2000 - 599 epochs total
Iteration 0, loss = 0.0223
Iteration 20, loss = 0.0023
Iteration 40, loss = 0.0047
Iteration 60, loss = 0.0028
Iteration 80, loss = 0.0025
--- Epoch 600 / 2000 - 600 epochs total
Iteration 0, loss = 0.0134
Iteration 20, loss = 0.0098
Iteration 40, loss = 0.0105
Iteration 60, loss = 0.0131
Iteration 80, loss = 0.0039
--- Epoch 601 / 2000 - 601 epochs total
Iteration 0, loss = 0.0117
Iteration 20, loss = 0.0024
Iteration 40, loss = 0.0023
Iteration 60, loss = 0.0234
Iteration 80, loss = 0.0014
--- Epoch 602 / 2000 - 602 epochs total
Iteration 0, loss = 0.0034
Iteration 20, loss = 0.0050
Iteration 40, loss = 0.0017
Iteration 60, loss = 0.0036
Iteration 80, loss = 0.0078
--- Epoch 603 / 2000 - 603 epochs total
Iteration 0, loss = 0.0020
Iteration 20, loss = 0.0022
Iteration 40, loss = 0.0076
Iteration 60, loss = 0.0009
Iteration 80, loss = 0.0038
--- Epoch 604 / 2000 - 604 epochs total
Iteration 0, loss = 0.0035
Iteration 20, loss = 0.0054
Iteration 40, loss = 0.0019
Iteration 60, loss = 0.0044
Iteration 80, loss = 0.0093
--- Epoch 605 / 2000 - 605 epochs total
Iteration 0, loss = 0.0073
Iteration 20, loss = 0.0051
Iteration 40, loss = 0.0036
Iteration 60, loss = 0.0034
Iteration 80, loss = 0.0041
--- Epoch 606 / 2000 - 606 epochs total
Iteration 0, loss = 0.0018
Iteration 20, loss = 0.0110
Iteration 40, loss = 0.0136
Iteration 60, loss = 0.0018
Iteration 80, loss = 0.0116
--- Epoch 607 / 2000 - 607 epochs total
Iteration 0, loss = 0.0043
Iteration 20, loss = 0.0022
Iteration 40, loss = 0.0046
Iteration 60, loss = 0.0176
Iteration 80, loss = 0.0027
--- Epoch 608 / 2000 - 608 epochs total
Iteration 0, loss = 0.0049
Iteration 20, loss = 0.0152
Iteration 40, loss = 0.0072
Iteration 60, loss = 0.0034
Iteration 80, loss = 0.0055
--- Epoch 609 / 2000 - 609 epochs total
Iteration 0, loss = 0.0045
Iteration 20, loss = 0.0059
Iteration 40, loss = 0.0078
Iteration 60, loss = 0.0054
Iteration 80, loss = 0.0104
--- Epoch 610 / 2000 - 610 epochs total
Iteration 0, loss = 0.0054
Iteration 20, loss = 0.0064
Iteration 40, loss = 0.0017
Iteration 60, loss = 0.0025
Iteration 80, loss = 0.0215
--- Epoch 611 / 2000 - 611 epochs total
Iteration 0, loss = 0.0215
Iteration 20, loss = 0.0030
Iteration 40, loss = 0.0050
Iteration 60, loss = 0.0220
Iteration 80, loss = 0.0020
--- Epoch 612 / 2000 - 612 epochs total
Iteration 0, loss = 0.0038
Iteration 20, loss = 0.0017
Iteration 40, loss = 0.0035
Iteration 60, loss = 0.0082
Iteration 80, loss = 0.0047
--- Epoch 613 / 2000 - 613 epochs total
Iteration 0, loss = 0.0204
Iteration 20, loss = 0.0145
Iteration 40, loss = 0.0075
Iteration 60, loss = 0.0016
Iteration 80, loss = 0.0118
--- Epoch 614 / 2000 - 614 epochs total
Iteration 0, loss = 0.0026
Iteration 20, loss = 0.0046
Iteration 40, loss = 0.0016
Iteration 60, loss = 0.0022
Iteration 80, loss = 0.0013
--- Epoch 615 / 2000 - 615 epochs total
Iteration 0, loss = 0.0018
Iteration 20, loss = 0.0218
Iteration 40, loss = 0.0068
Iteration 60, loss = 0.0041
Iteration 80, loss = 0.0045
--- Epoch 616 / 2000 - 616 epochs total
Iteration 0, loss = 0.0016
Iteration 20, loss = 0.0018
Iteration 40, loss = 0.0028
Iteration 60, loss = 0.0025
Iteration 80, loss = 0.0027
--- Epoch 617 / 2000 - 617 epochs total
Iteration 0, loss = 0.0037
Iteration 20, loss = 0.0050
Iteration 40, loss = 0.0023
Iteration 60, loss = 0.0110
Iteration 80, loss = 0.0060
--- Epoch 618 / 2000 - 618 epochs total
Iteration 0, loss = 0.0116
Iteration 20, loss = 0.0040
Iteration 40, loss = 0.0021
Iteration 60, loss = 0.0029
Iteration 80, loss = 0.0037
--- Epoch 619 / 2000 - 619 epochs total
Iteration 0, loss = 0.0057
Iteration 20, loss = 0.0050
Iteration 40, loss = 0.0018
Iteration 60, loss = 0.0035
Iteration 80, loss = 0.0037
--- Epoch 620 / 2000 - 620 epochs total
Iteration 0, loss = 0.0037
Iteration 20, loss = 0.0057
Iteration 40, loss = 0.0116
Iteration 60, loss = 0.0102
Iteration 80, loss = 0.0130
--- Epoch 621 / 2000 - 621 epochs total
Iteration 0, loss = 0.0017
Iteration 20, loss = 0.0056
Iteration 40, loss = 0.0036
Iteration 60, loss = 0.0106
Iteration 80, loss = 0.0037
--- Epoch 622 / 2000 - 622 epochs total
Iteration 0, loss = 0.0049
Iteration 20, loss = 0.0032
Iteration 40, loss = 0.0043
Iteration 60, loss = 0.0136
Iteration 80, loss = 0.0023
--- Epoch 623 / 2000 - 623 epochs total
Iteration 0, loss = 0.0083
Iteration 20, loss = 0.0041
Iteration 40, loss = 0.0028
Iteration 60, loss = 0.0067
Iteration 80, loss = 0.0069
--- Epoch 624 / 2000 - 624 epochs total
Iteration 0, loss = 0.0093
Iteration 20, loss = 0.0029
Iteration 40, loss = 0.0144
Iteration 60, loss = 0.0033
Iteration 80, loss = 0.0071
--- Epoch 625 / 2000 - 625 epochs total
Iteration 0, loss = 0.0029
Iteration 20, loss = 0.0010
Iteration 40, loss = 0.0082
Iteration 60, loss = 0.0047
Iteration 80, loss = 0.0275
--- Epoch 626 / 2000 - 626 epochs total
Iteration 0, loss = 0.0016
Iteration 20, loss = 0.0029
Iteration 40, loss = 0.0015
Iteration 60, loss = 0.0103
Iteration 80, loss = 0.0017
--- Epoch 627 / 2000 - 627 epochs total
Iteration 0, loss = 0.0018
Iteration 20, loss = 0.0052
Iteration 40, loss = 0.0015
Iteration 60, loss = 0.0028
Iteration 80, loss = 0.0121
--- Epoch 628 / 2000 - 628 epochs total
Iteration 0, loss = 0.0037
Iteration 20, loss = 0.0040
Iteration 40, loss = 0.0045
Iteration 60, loss = 0.0030
Iteration 80, loss = 0.0030
--- Epoch 629 / 2000 - 629 epochs total
Iteration 0, loss = 0.0016
Iteration 20, loss = 0.0014
Iteration 40, loss = 0.0029
Iteration 60, loss = 0.0020
Iteration 80, loss = 0.0017
--- Epoch 630 / 2000 - 630 epochs total
Iteration 0, loss = 0.0045
Iteration 20, loss = 0.0074
Iteration 40, loss = 0.0049
Iteration 60, loss = 0.0036
Iteration 80, loss = 0.0064
--- Epoch 631 / 2000 - 631 epochs total
Iteration 0, loss = 0.0064
Iteration 20, loss = 0.0015
Iteration 40, loss = 0.0035
Iteration 60, loss = 0.0016
Iteration 80, loss = 0.0044
--- Epoch 632 / 2000 - 632 epochs total
Iteration 0, loss = 0.0027
Iteration 20, loss = 0.0075
Iteration 40, loss = 0.0051
Iteration 60, loss = 0.0163
Iteration 80, loss = 0.0009
--- Epoch 633 / 2000 - 633 epochs total
Iteration 0, loss = 0.0148
Iteration 20, loss = 0.0089
Iteration 40, loss = 0.0031
Iteration 60, loss = 0.0043
Iteration 80, loss = 0.0019
--- Epoch 634 / 2000 - 634 epochs total
Iteration 0, loss = 0.0038
Iteration 20, loss = 0.0033
Iteration 40, loss = 0.0065
Iteration 60, loss = 0.0056
Iteration 80, loss = 0.0075
--- Epoch 635 / 2000 - 635 epochs total
Iteration 0, loss = 0.0023
Iteration 20, loss = 0.0041
Iteration 40, loss = 0.0018
Iteration 60, loss = 0.0037
Iteration 80, loss = 0.0140
--- Epoch 636 / 2000 - 636 epochs total
Iteration 0, loss = 0.0080
Iteration 20, loss = 0.0074
Iteration 40, loss = 0.0054
Iteration 60, loss = 0.0026
Iteration 80, loss = 0.0058
--- Epoch 637 / 2000 - 637 epochs total
Iteration 0, loss = 0.0078
Iteration 20, loss = 0.0036
Iteration 40, loss = 0.0014
Iteration 60, loss = 0.0014
Iteration 80, loss = 0.0069
--- Epoch 638 / 2000 - 638 epochs total
Iteration 0, loss = 0.0029
Iteration 20, loss = 0.0021
Iteration 40, loss = 0.0054
Iteration 60, loss = 0.0155
Iteration 80, loss = 0.0028
--- Epoch 639 / 2000 - 639 epochs total
Iteration 0, loss = 0.0032
Iteration 20, loss = 0.0024
Iteration 40, loss = 0.0029
Iteration 60, loss = 0.0233
Iteration 80, loss = 0.0108
--- Epoch 640 / 2000 - 640 epochs total
Iteration 0, loss = 0.0103
Iteration 20, loss = 0.0040
Iteration 40, loss = 0.0041
Iteration 60, loss = 0.0066
Iteration 80, loss = 0.0017
--- Epoch 641 / 2000 - 641 epochs total
Iteration 0, loss = 0.0097
Iteration 20, loss = 0.0022
Iteration 40, loss = 0.0088
Iteration 60, loss = 0.0031
Iteration 80, loss = 0.0042
--- Epoch 642 / 2000 - 642 epochs total
Iteration 0, loss = 0.0048
Iteration 20, loss = 0.0226
Iteration 40, loss = 0.0041
Iteration 60, loss = 0.0021
Iteration 80, loss = 0.0025
--- Epoch 643 / 2000 - 643 epochs total
Iteration 0, loss = 0.0074
Iteration 20, loss = 0.0041
Iteration 40, loss = 0.0044
Iteration 60, loss = 0.0062
Iteration 80, loss = 0.0041
--- Epoch 644 / 2000 - 644 epochs total
Iteration 0, loss = 0.0039
Iteration 20, loss = 0.0092
Iteration 40, loss = 0.0036
Iteration 60, loss = 0.0027
Iteration 80, loss = 0.0072
--- Epoch 645 / 2000 - 645 epochs total
Iteration 0, loss = 0.0036
Iteration 20, loss = 0.0043
Iteration 40, loss = 0.0023
Iteration 60, loss = 0.0027
Iteration 80, loss = 0.0028
--- Epoch 646 / 2000 - 646 epochs total
Iteration 0, loss = 0.0037
Iteration 20, loss = 0.0033
Iteration 40, loss = 0.0190
Iteration 60, loss = 0.0045
Iteration 80, loss = 0.0037
--- Epoch 647 / 2000 - 647 epochs total
Iteration 0, loss = 0.0043
Iteration 20, loss = 0.0059
Iteration 40, loss = 0.0042
Iteration 60, loss = 0.0106
Iteration 80, loss = 0.0173
--- Epoch 648 / 2000 - 648 epochs total
Iteration 0, loss = 0.0015
Iteration 20, loss = 0.0098
Iteration 40, loss = 0.0045
Iteration 60, loss = 0.0024
Iteration 80, loss = 0.0080
--- Epoch 649 / 2000 - 649 epochs total
Iteration 0, loss = 0.0019
Iteration 20, loss = 0.0045
Iteration 40, loss = 0.0126
Iteration 60, loss = 0.0048
Iteration 80, loss = 0.0028
--- Epoch 650 / 2000 - 650 epochs total
Iteration 0, loss = 0.0058
Iteration 20, loss = 0.0128
Iteration 40, loss = 0.0045
Iteration 60, loss = 0.0033
Iteration 80, loss = 0.0034
--- Epoch 651 / 2000 - 651 epochs total
Iteration 0, loss = 0.0073
Iteration 20, loss = 0.0024
Iteration 40, loss = 0.0018
Iteration 60, loss = 0.0025
Iteration 80, loss = 0.0025
--- Epoch 652 / 2000 - 652 epochs total
Iteration 0, loss = 0.0068
Iteration 20, loss = 0.0068
Iteration 40, loss = 0.0096
Iteration 60, loss = 0.0020
Iteration 80, loss = 0.0019
--- Epoch 653 / 2000 - 653 epochs total
Iteration 0, loss = 0.0125
Iteration 20, loss = 0.0064
Iteration 40, loss = 0.0107
Iteration 60, loss = 0.0077
Iteration 80, loss = 0.0028
--- Epoch 654 / 2000 - 654 epochs total
Iteration 0, loss = 0.0122
Iteration 20, loss = 0.0034
Iteration 40, loss = 0.0140
Iteration 60, loss = 0.0021
Iteration 80, loss = 0.0350
--- Epoch 655 / 2000 - 655 epochs total
Iteration 0, loss = 0.0023
Iteration 20, loss = 0.0045
Iteration 40, loss = 0.0101
Iteration 60, loss = 0.0062
Iteration 80, loss = 0.0056
--- Epoch 656 / 2000 - 656 epochs total
Iteration 0, loss = 0.0031
Iteration 20, loss = 0.0124
Iteration 40, loss = 0.0028
Iteration 60, loss = 0.0090
Iteration 80, loss = 0.0018
--- Epoch 657 / 2000 - 657 epochs total
Iteration 0, loss = 0.0069
Iteration 20, loss = 0.0040
Iteration 40, loss = 0.0029
Iteration 60, loss = 0.0117
Iteration 80, loss = 0.0019
--- Epoch 658 / 2000 - 658 epochs total
Iteration 0, loss = 0.0064
Iteration 20, loss = 0.0040
Iteration 40, loss = 0.0026
Iteration 60, loss = 0.0021
Iteration 80, loss = 0.0024
--- Epoch 659 / 2000 - 659 epochs total
Iteration 0, loss = 0.0243
Iteration 20, loss = 0.0050
Iteration 40, loss = 0.0098
Iteration 60, loss = 0.0045
Iteration 80, loss = 0.0057
--- Epoch 660 / 2000 - 660 epochs total
Iteration 0, loss = 0.0022
Iteration 20, loss = 0.0034
Iteration 40, loss = 0.0047
Iteration 60, loss = 0.0279
Iteration 80, loss = 0.0022
--- Epoch 661 / 2000 - 661 epochs total
Iteration 0, loss = 0.0057
Iteration 20, loss = 0.0054
Iteration 40, loss = 0.0029
Iteration 60, loss = 0.0026
Iteration 80, loss = 0.0031
--- Epoch 662 / 2000 - 662 epochs total
Iteration 0, loss = 0.0051
Iteration 20, loss = 0.0077
Iteration 40, loss = 0.0074
Iteration 60, loss = 0.0027
Iteration 80, loss = 0.0076
--- Epoch 663 / 2000 - 663 epochs total
Iteration 0, loss = 0.0215
Iteration 20, loss = 0.0014
Iteration 40, loss = 0.0026
Iteration 60, loss = 0.0026
Iteration 80, loss = 0.0033
--- Epoch 664 / 2000 - 664 epochs total
Iteration 0, loss = 0.0013
Iteration 20, loss = 0.0056
Iteration 40, loss = 0.0043
Iteration 60, loss = 0.0023
Iteration 80, loss = 0.0058
--- Epoch 665 / 2000 - 665 epochs total
Iteration 0, loss = 0.0049
Iteration 20, loss = 0.0049
Iteration 40, loss = 0.0096
Iteration 60, loss = 0.0021
Iteration 80, loss = 0.0363
--- Epoch 666 / 2000 - 666 epochs total
Iteration 0, loss = 0.0029
Iteration 20, loss = 0.0011
Iteration 40, loss = 0.0031
Iteration 60, loss = 0.0049
Iteration 80, loss = 0.0043
--- Epoch 667 / 2000 - 667 epochs total
Iteration 0, loss = 0.0081
Iteration 20, loss = 0.0040
Iteration 40, loss = 0.0027
Iteration 60, loss = 0.0053
Iteration 80, loss = 0.0015
--- Epoch 668 / 2000 - 668 epochs total
Iteration 0, loss = 0.0096
Iteration 20, loss = 0.0063
Iteration 40, loss = 0.0028
Iteration 60, loss = 0.0024
Iteration 80, loss = 0.0130
--- Epoch 669 / 2000 - 669 epochs total
Iteration 0, loss = 0.0033
Iteration 20, loss = 0.0030
Iteration 40, loss = 0.0053
Iteration 60, loss = 0.0017
Iteration 80, loss = 0.0021
--- Epoch 670 / 2000 - 670 epochs total
Iteration 0, loss = 0.0033
Iteration 20, loss = 0.0026
Iteration 40, loss = 0.0124
Iteration 60, loss = 0.0092
Iteration 80, loss = 0.0141
--- Epoch 671 / 2000 - 671 epochs total
Iteration 0, loss = 0.0016
Iteration 20, loss = 0.0047
Iteration 40, loss = 0.0014
Iteration 60, loss = 0.0043
Iteration 80, loss = 0.0038
--- Epoch 672 / 2000 - 672 epochs total
Iteration 0, loss = 0.0089
Iteration 20, loss = 0.0224
Iteration 40, loss = 0.0049
Iteration 60, loss = 0.0034
Iteration 80, loss = 0.0015
--- Epoch 673 / 2000 - 673 epochs total
Iteration 0, loss = 0.0245
Iteration 20, loss = 0.0040
Iteration 40, loss = 0.0119
Iteration 60, loss = 0.0100
Iteration 80, loss = 0.0147
--- Epoch 674 / 2000 - 674 epochs total
Iteration 0, loss = 0.0025
Iteration 20, loss = 0.0016
Iteration 40, loss = 0.0132
Iteration 60, loss = 0.0059
Iteration 80, loss = 0.0102
--- Epoch 675 / 2000 - 675 epochs total
Iteration 0, loss = 0.0027
Iteration 20, loss = 0.0449
Iteration 40, loss = 0.0068
Iteration 60, loss = 0.0016
Iteration 80, loss = 0.0025
--- Epoch 676 / 2000 - 676 epochs total
Iteration 0, loss = 0.0041
Iteration 20, loss = 0.0026
Iteration 40, loss = 0.0163
Iteration 60, loss = 0.0023
Iteration 80, loss = 0.0040
--- Epoch 677 / 2000 - 677 epochs total
Iteration 0, loss = 0.0053
Iteration 20, loss = 0.0062
Iteration 40, loss = 0.0033
Iteration 60, loss = 0.0045
Iteration 80, loss = 0.0013
--- Epoch 678 / 2000 - 678 epochs total
Iteration 0, loss = 0.0021
Iteration 20, loss = 0.0026
Iteration 40, loss = 0.0017
Iteration 60, loss = 0.0012
Iteration 80, loss = 0.0017
--- Epoch 679 / 2000 - 679 epochs total
Iteration 0, loss = 0.0053
Iteration 20, loss = 0.0043
Iteration 40, loss = 0.0231
Iteration 60, loss = 0.0020
Iteration 80, loss = 0.0129
--- Epoch 680 / 2000 - 680 epochs total
Iteration 0, loss = 0.0220
Iteration 20, loss = 0.0023
Iteration 40, loss = 0.0036
Iteration 60, loss = 0.0060
Iteration 80, loss = 0.0149
--- Epoch 681 / 2000 - 681 epochs total
Iteration 0, loss = 0.0149
Iteration 20, loss = 0.0061
Iteration 40, loss = 0.0025
Iteration 60, loss = 0.0021
Iteration 80, loss = 0.0016
--- Epoch 682 / 2000 - 682 epochs total
Iteration 0, loss = 0.0022
Iteration 20, loss = 0.0050
Iteration 40, loss = 0.0047
Iteration 60, loss = 0.0026
Iteration 80, loss = 0.0051
--- Epoch 683 / 2000 - 683 epochs total
Iteration 0, loss = 0.0032
Iteration 20, loss = 0.0026
Iteration 40, loss = 0.0017
Iteration 60, loss = 0.0028
Iteration 80, loss = 0.0014
--- Epoch 684 / 2000 - 684 epochs total
Iteration 0, loss = 0.0028
Iteration 20, loss = 0.0015
Iteration 40, loss = 0.0033
Iteration 60, loss = 0.0203
Iteration 80, loss = 0.0036
--- Epoch 685 / 2000 - 685 epochs total
Iteration 0, loss = 0.0094
Iteration 20, loss = 0.0061
Iteration 40, loss = 0.0365
Iteration 60, loss = 0.0023
Iteration 80, loss = 0.0044
--- Epoch 686 / 2000 - 686 epochs total
Iteration 0, loss = 0.0114
Iteration 20, loss = 0.0064
Iteration 40, loss = 0.0066
Iteration 60, loss = 0.0046
Iteration 80, loss = 0.0025
--- Epoch 687 / 2000 - 687 epochs total
Iteration 0, loss = 0.0034
Iteration 20, loss = 0.0064
Iteration 40, loss = 0.0041
Iteration 60, loss = 0.0090
Iteration 80, loss = 0.0027
--- Epoch 688 / 2000 - 688 epochs total
Iteration 0, loss = 0.0042
Iteration 20, loss = 0.0036
Iteration 40, loss = 0.0027
Iteration 60, loss = 0.0049
Iteration 80, loss = 0.0062
--- Epoch 689 / 2000 - 689 epochs total
Iteration 0, loss = 0.0116
Iteration 20, loss = 0.0070
Iteration 40, loss = 0.0014
Iteration 60, loss = 0.0064
Iteration 80, loss = 0.0023
--- Epoch 690 / 2000 - 690 epochs total
Iteration 0, loss = 0.0023
Iteration 20, loss = 0.0057
Iteration 40, loss = 0.0070
Iteration 60, loss = 0.0015
Iteration 80, loss = 0.0051
--- Epoch 691 / 2000 - 691 epochs total
Iteration 0, loss = 0.0028
Iteration 20, loss = 0.0042
Iteration 40, loss = 0.0185
Iteration 60, loss = 0.0014
Iteration 80, loss = 0.0022
--- Epoch 692 / 2000 - 692 epochs total
Iteration 0, loss = 0.0143
Iteration 20, loss = 0.0020
Iteration 40, loss = 0.0035
Iteration 60, loss = 0.0054
Iteration 80, loss = 0.0051
--- Epoch 693 / 2000 - 693 epochs total
Iteration 0, loss = 0.0021
Iteration 20, loss = 0.0091
Iteration 40, loss = 0.0086
Iteration 60, loss = 0.0056
Iteration 80, loss = 0.0052
--- Epoch 694 / 2000 - 694 epochs total
Iteration 0, loss = 0.0091
Iteration 20, loss = 0.0055
Iteration 40, loss = 0.0054
Iteration 60, loss = 0.0040
Iteration 80, loss = 0.0035
--- Epoch 695 / 2000 - 695 epochs total
Iteration 0, loss = 0.0026
Iteration 20, loss = 0.0085
Iteration 40, loss = 0.0056
Iteration 60, loss = 0.0069
Iteration 80, loss = 0.0087
--- Epoch 696 / 2000 - 696 epochs total
Iteration 0, loss = 0.0042
Iteration 20, loss = 0.0084
Iteration 40, loss = 0.0041
Iteration 60, loss = 0.0051
Iteration 80, loss = 0.0025
--- Epoch 697 / 2000 - 697 epochs total
Iteration 0, loss = 0.0028
Iteration 20, loss = 0.0020
Iteration 40, loss = 0.0021
Iteration 60, loss = 0.0076
Iteration 80, loss = 0.0069
--- Epoch 698 / 2000 - 698 epochs total
Iteration 0, loss = 0.0027
Iteration 20, loss = 0.0049
Iteration 40, loss = 0.0069
Iteration 60, loss = 0.0037
Iteration 80, loss = 0.0044
--- Epoch 699 / 2000 - 699 epochs total
Iteration 0, loss = 0.0078
Iteration 20, loss = 0.0032
Iteration 40, loss = 0.0017
Iteration 60, loss = 0.0060
Iteration 80, loss = 0.0014
--- Epoch 700 / 2000 - 700 epochs total
Iteration 0, loss = 0.0018
Iteration 20, loss = 0.0040
Iteration 40, loss = 0.0113
Iteration 60, loss = 0.0020
Iteration 80, loss = 0.0039
--- Epoch 701 / 2000 - 701 epochs total
Iteration 0, loss = 0.0024
Iteration 20, loss = 0.0013
Iteration 40, loss = 0.0025
Iteration 60, loss = 0.0016
Iteration 80, loss = 0.0210
--- Epoch 702 / 2000 - 702 epochs total
Iteration 0, loss = 0.0119
Iteration 20, loss = 0.0020
Iteration 40, loss = 0.0019
Iteration 60, loss = 0.0071
Iteration 80, loss = 0.0021
--- Epoch 703 / 2000 - 703 epochs total
Iteration 0, loss = 0.0036
Iteration 20, loss = 0.0023
Iteration 40, loss = 0.0085
Iteration 60, loss = 0.0035
Iteration 80, loss = 0.0025
--- Epoch 704 / 2000 - 704 epochs total
Iteration 0, loss = 0.0062
Iteration 20, loss = 0.0029
Iteration 40, loss = 0.0187
Iteration 60, loss = 0.0122
Iteration 80, loss = 0.0193
--- Epoch 705 / 2000 - 705 epochs total
Iteration 0, loss = 0.0079
Iteration 20, loss = 0.0228
Iteration 40, loss = 0.0085
Iteration 60, loss = 0.0070
Iteration 80, loss = 0.0015
--- Epoch 706 / 2000 - 706 epochs total
Iteration 0, loss = 0.0056
Iteration 20, loss = 0.0034
Iteration 40, loss = 0.0026
Iteration 60, loss = 0.0048
Iteration 80, loss = 0.0037
--- Epoch 707 / 2000 - 707 epochs total
Iteration 0, loss = 0.0180
Iteration 20, loss = 0.0070
Iteration 40, loss = 0.0062
Iteration 60, loss = 0.0078
Iteration 80, loss = 0.0032
--- Epoch 708 / 2000 - 708 epochs total
Iteration 0, loss = 0.0125
Iteration 20, loss = 0.0030
Iteration 40, loss = 0.0029
Iteration 60, loss = 0.0030
Iteration 80, loss = 0.0064
--- Epoch 709 / 2000 - 709 epochs total
Iteration 0, loss = 0.0043
Iteration 20, loss = 0.0105
Iteration 40, loss = 0.0037
Iteration 60, loss = 0.0013
Iteration 80, loss = 0.0037
--- Epoch 710 / 2000 - 710 epochs total
Iteration 0, loss = 0.0023
Iteration 20, loss = 0.0066
Iteration 40, loss = 0.0019
Iteration 60, loss = 0.0060
Iteration 80, loss = 0.0061
--- Epoch 711 / 2000 - 711 epochs total
Iteration 0, loss = 0.0062
Iteration 20, loss = 0.0060
Iteration 40, loss = 0.0146
Iteration 60, loss = 0.0047
Iteration 80, loss = 0.0051
--- Epoch 712 / 2000 - 712 epochs total
Iteration 0, loss = 0.0017
Iteration 20, loss = 0.0089
Iteration 40, loss = 0.0016
Iteration 60, loss = 0.0164
Iteration 80, loss = 0.0024
--- Epoch 713 / 2000 - 713 epochs total
Iteration 0, loss = 0.0034
Iteration 20, loss = 0.0040
Iteration 40, loss = 0.0014
Iteration 60, loss = 0.0021
Iteration 80, loss = 0.0044
--- Epoch 714 / 2000 - 714 epochs total
Iteration 0, loss = 0.0017
Iteration 20, loss = 0.0051
Iteration 40, loss = 0.0131
Iteration 60, loss = 0.0025
Iteration 80, loss = 0.0025
--- Epoch 715 / 2000 - 715 epochs total
Iteration 0, loss = 0.0148
Iteration 20, loss = 0.0037
Iteration 40, loss = 0.0065
Iteration 60, loss = 0.0075
Iteration 80, loss = 0.0045
--- Epoch 716 / 2000 - 716 epochs total
Iteration 0, loss = 0.0042
Iteration 20, loss = 0.0102
Iteration 40, loss = 0.0024
Iteration 60, loss = 0.0041
Iteration 80, loss = 0.0020
--- Epoch 717 / 2000 - 717 epochs total
Iteration 0, loss = 0.0094
Iteration 20, loss = 0.0035
Iteration 40, loss = 0.0017
Iteration 60, loss = 0.0077
Iteration 80, loss = 0.0057
--- Epoch 718 / 2000 - 718 epochs total
Iteration 0, loss = 0.0052
Iteration 20, loss = 0.0188
Iteration 40, loss = 0.0036
Iteration 60, loss = 0.0076
Iteration 80, loss = 0.0052
--- Epoch 719 / 2000 - 719 epochs total
Iteration 0, loss = 0.0021
Iteration 20, loss = 0.0022
Iteration 40, loss = 0.0016
Iteration 60, loss = 0.0028
Iteration 80, loss = 0.0027
--- Epoch 720 / 2000 - 720 epochs total
Iteration 0, loss = 0.0048
Iteration 20, loss = 0.0028
Iteration 40, loss = 0.0031
Iteration 60, loss = 0.0046
Iteration 80, loss = 0.0047
--- Epoch 721 / 2000 - 721 epochs total
Iteration 0, loss = 0.0027
Iteration 20, loss = 0.0029
Iteration 40, loss = 0.0031
Iteration 60, loss = 0.0075
Iteration 80, loss = 0.0018
--- Epoch 722 / 2000 - 722 epochs total
Iteration 0, loss = 0.0019
Iteration 20, loss = 0.0110
Iteration 40, loss = 0.0036
Iteration 60, loss = 0.0074
Iteration 80, loss = 0.0081
--- Epoch 723 / 2000 - 723 epochs total
Iteration 0, loss = 0.0051
Iteration 20, loss = 0.0017
Iteration 40, loss = 0.0056
Iteration 60, loss = 0.0048
Iteration 80, loss = 0.0051
--- Epoch 724 / 2000 - 724 epochs total
Iteration 0, loss = 0.0052
Iteration 20, loss = 0.0050
Iteration 40, loss = 0.0049
Iteration 60, loss = 0.0029
Iteration 80, loss = 0.0143
--- Epoch 725 / 2000 - 725 epochs total
Iteration 0, loss = 0.0033
Iteration 20, loss = 0.0041
Iteration 40, loss = 0.0019
Iteration 60, loss = 0.0110
Iteration 80, loss = 0.0027
--- Epoch 726 / 2000 - 726 epochs total
Iteration 0, loss = 0.0020
Iteration 20, loss = 0.0023
Iteration 40, loss = 0.0140
Iteration 60, loss = 0.0027
Iteration 80, loss = 0.0026
--- Epoch 727 / 2000 - 727 epochs total
Iteration 0, loss = 0.0052
Iteration 20, loss = 0.0105
Iteration 40, loss = 0.0027
Iteration 60, loss = 0.0219
Iteration 80, loss = 0.0044
--- Epoch 728 / 2000 - 728 epochs total
Iteration 0, loss = 0.0120
Iteration 20, loss = 0.0013
Iteration 40, loss = 0.0029
Iteration 60, loss = 0.0019
Iteration 80, loss = 0.0206
--- Epoch 729 / 2000 - 729 epochs total
Iteration 0, loss = 0.0019
Iteration 20, loss = 0.0124
Iteration 40, loss = 0.0068
Iteration 60, loss = 0.0028
Iteration 80, loss = 0.0067
--- Epoch 730 / 2000 - 730 epochs total
Iteration 0, loss = 0.0207
Iteration 20, loss = 0.0040
Iteration 40, loss = 0.0018
Iteration 60, loss = 0.0079
Iteration 80, loss = 0.0064
--- Epoch 731 / 2000 - 731 epochs total
Iteration 0, loss = 0.0012
Iteration 20, loss = 0.0048
Iteration 40, loss = 0.0126
Iteration 60, loss = 0.0020
Iteration 80, loss = 0.0098
--- Epoch 732 / 2000 - 732 epochs total
Iteration 0, loss = 0.0037
Iteration 20, loss = 0.0165
Iteration 40, loss = 0.0058
Iteration 60, loss = 0.0024
Iteration 80, loss = 0.0045
--- Epoch 733 / 2000 - 733 epochs total
Iteration 0, loss = 0.0033
Iteration 20, loss = 0.0040
Iteration 40, loss = 0.0077
Iteration 60, loss = 0.0025
Iteration 80, loss = 0.0037
--- Epoch 734 / 2000 - 734 epochs total
Iteration 0, loss = 0.0102
Iteration 20, loss = 0.0038
Iteration 40, loss = 0.0016
Iteration 60, loss = 0.0032
Iteration 80, loss = 0.0052
--- Epoch 735 / 2000 - 735 epochs total
Iteration 0, loss = 0.0068
Iteration 20, loss = 0.0025
Iteration 40, loss = 0.0039
Iteration 60, loss = 0.0023
Iteration 80, loss = 0.0055
--- Epoch 736 / 2000 - 736 epochs total
Iteration 0, loss = 0.0013
Iteration 20, loss = 0.0116
Iteration 40, loss = 0.0035
Iteration 60, loss = 0.0043
Iteration 80, loss = 0.0022
--- Epoch 737 / 2000 - 737 epochs total
Iteration 0, loss = 0.0128
Iteration 20, loss = 0.0078
Iteration 40, loss = 0.0056
Iteration 60, loss = 0.0086
Iteration 80, loss = 0.0096
--- Epoch 738 / 2000 - 738 epochs total
Iteration 0, loss = 0.0134
Iteration 20, loss = 0.0044
Iteration 40, loss = 0.0085
Iteration 60, loss = 0.0087
Iteration 80, loss = 0.0018
--- Epoch 739 / 2000 - 739 epochs total
Iteration 0, loss = 0.0024
Iteration 20, loss = 0.0054
Iteration 40, loss = 0.0148
Iteration 60, loss = 0.0213
Iteration 80, loss = 0.0022
--- Epoch 740 / 2000 - 740 epochs total
Iteration 0, loss = 0.0016
Iteration 20, loss = 0.0030
Iteration 40, loss = 0.0017
Iteration 60, loss = 0.0041
Iteration 80, loss = 0.0067
--- Epoch 741 / 2000 - 741 epochs total
Iteration 0, loss = 0.0208
Iteration 20, loss = 0.0050
Iteration 40, loss = 0.0077
Iteration 60, loss = 0.0039
Iteration 80, loss = 0.0081
--- Epoch 742 / 2000 - 742 epochs total
Iteration 0, loss = 0.0055
Iteration 20, loss = 0.0051
Iteration 40, loss = 0.0112
Iteration 60, loss = 0.0079
Iteration 80, loss = 0.0066
--- Epoch 743 / 2000 - 743 epochs total
Iteration 0, loss = 0.0038
Iteration 20, loss = 0.0019
Iteration 40, loss = 0.0038
Iteration 60, loss = 0.0027
Iteration 80, loss = 0.0370
--- Epoch 744 / 2000 - 744 epochs total
Iteration 0, loss = 0.0093
Iteration 20, loss = 0.0025
Iteration 40, loss = 0.0017
Iteration 60, loss = 0.0033
Iteration 80, loss = 0.0036
--- Epoch 745 / 2000 - 745 epochs total
Iteration 0, loss = 0.0146
Iteration 20, loss = 0.0043
Iteration 40, loss = 0.0098
Iteration 60, loss = 0.0141
Iteration 80, loss = 0.0142
--- Epoch 746 / 2000 - 746 epochs total
Iteration 0, loss = 0.0044
Iteration 20, loss = 0.0021
Iteration 40, loss = 0.0299
Iteration 60, loss = 0.0057
Iteration 80, loss = 0.0050
--- Epoch 747 / 2000 - 747 epochs total
Iteration 0, loss = 0.0079
Iteration 20, loss = 0.0044
Iteration 40, loss = 0.0024
Iteration 60, loss = 0.0026
Iteration 80, loss = 0.0124
--- Epoch 748 / 2000 - 748 epochs total
Iteration 0, loss = 0.0048
Iteration 20, loss = 0.0061
Iteration 40, loss = 0.0049
Iteration 60, loss = 0.0022
Iteration 80, loss = 0.0031
--- Epoch 749 / 2000 - 749 epochs total
Iteration 0, loss = 0.0026
Iteration 20, loss = 0.0026
Iteration 40, loss = 0.0020
Iteration 60, loss = 0.0019
Iteration 80, loss = 0.0142
--- Epoch 750 / 2000 - 750 epochs total
Iteration 0, loss = 0.0020
Iteration 20, loss = 0.0084
Iteration 40, loss = 0.0038
Iteration 60, loss = 0.0035
Iteration 80, loss = 0.0067
--- Epoch 751 / 2000 - 751 epochs total
Iteration 0, loss = 0.0028
Iteration 20, loss = 0.0038
Iteration 40, loss = 0.0067
Iteration 60, loss = 0.0027
Iteration 80, loss = 0.0057
--- Epoch 752 / 2000 - 752 epochs total
Iteration 0, loss = 0.0058
Iteration 20, loss = 0.0076
Iteration 40, loss = 0.0037
Iteration 60, loss = 0.0063
Iteration 80, loss = 0.0031
--- Epoch 753 / 2000 - 753 epochs total
Iteration 0, loss = 0.0148
Iteration 20, loss = 0.0043
Iteration 40, loss = 0.0040
Iteration 60, loss = 0.0118
Iteration 80, loss = 0.0152
--- Epoch 754 / 2000 - 754 epochs total
Iteration 0, loss = 0.0016
Iteration 20, loss = 0.0019
Iteration 40, loss = 0.0178
Iteration 60, loss = 0.0007
Iteration 80, loss = 0.0063
--- Epoch 755 / 2000 - 755 epochs total
Iteration 0, loss = 0.0071
Iteration 20, loss = 0.0069
Iteration 40, loss = 0.0032
Iteration 60, loss = 0.0019
Iteration 80, loss = 0.0021
--- Epoch 756 / 2000 - 756 epochs total
Iteration 0, loss = 0.0041
Iteration 20, loss = 0.0093
Iteration 40, loss = 0.0035
Iteration 60, loss = 0.0027
Iteration 80, loss = 0.0056
--- Epoch 757 / 2000 - 757 epochs total
Iteration 0, loss = 0.0057
Iteration 20, loss = 0.0021
Iteration 40, loss = 0.0022
Iteration 60, loss = 0.0025
Iteration 80, loss = 0.0041
--- Epoch 758 / 2000 - 758 epochs total
Iteration 0, loss = 0.0302
Iteration 20, loss = 0.0033
Iteration 40, loss = 0.0070
Iteration 60, loss = 0.0031
Iteration 80, loss = 0.0024
--- Epoch 759 / 2000 - 759 epochs total
Iteration 0, loss = 0.0011
Iteration 20, loss = 0.0024
Iteration 40, loss = 0.0021
Iteration 60, loss = 0.0028
Iteration 80, loss = 0.0066
--- Epoch 760 / 2000 - 760 epochs total
Iteration 0, loss = 0.0036
Iteration 20, loss = 0.0049
Iteration 40, loss = 0.0159
Iteration 60, loss = 0.0017
Iteration 80, loss = 0.0063
--- Epoch 761 / 2000 - 761 epochs total
Iteration 0, loss = 0.0019
Iteration 20, loss = 0.0158
Iteration 40, loss = 0.0043
Iteration 60, loss = 0.0023
Iteration 80, loss = 0.0042
--- Epoch 762 / 2000 - 762 epochs total
Iteration 0, loss = 0.0116
Iteration 20, loss = 0.0082
Iteration 40, loss = 0.0045
Iteration 60, loss = 0.0047
Iteration 80, loss = 0.0042
--- Epoch 763 / 2000 - 763 epochs total
Iteration 0, loss = 0.0082
Iteration 20, loss = 0.0103
Iteration 40, loss = 0.0037
Iteration 60, loss = 0.0047
Iteration 80, loss = 0.0028
--- Epoch 764 / 2000 - 764 epochs total
Iteration 0, loss = 0.0024
Iteration 20, loss = 0.0046
Iteration 40, loss = 0.0028
Iteration 60, loss = 0.0038
Iteration 80, loss = 0.0019
--- Epoch 765 / 2000 - 765 epochs total
Iteration 0, loss = 0.0016
Iteration 20, loss = 0.0020
Iteration 40, loss = 0.0064
Iteration 60, loss = 0.0020
Iteration 80, loss = 0.0112
--- Epoch 766 / 2000 - 766 epochs total
Iteration 0, loss = 0.0024
Iteration 20, loss = 0.0075
Iteration 40, loss = 0.0034
Iteration 60, loss = 0.0023
Iteration 80, loss = 0.0034
--- Epoch 767 / 2000 - 767 epochs total
Iteration 0, loss = 0.0235
Iteration 20, loss = 0.0049
Iteration 40, loss = 0.0085
Iteration 60, loss = 0.0025
Iteration 80, loss = 0.0026
--- Epoch 768 / 2000 - 768 epochs total
Iteration 0, loss = 0.0044
Iteration 20, loss = 0.0026
Iteration 40, loss = 0.0054
Iteration 60, loss = 0.0032
Iteration 80, loss = 0.0067
--- Epoch 769 / 2000 - 769 epochs total
Iteration 0, loss = 0.0050
Iteration 20, loss = 0.0016
Iteration 40, loss = 0.0032
Iteration 60, loss = 0.0068
Iteration 80, loss = 0.0073
--- Epoch 770 / 2000 - 770 epochs total
Iteration 0, loss = 0.0031
Iteration 20, loss = 0.0070
Iteration 40, loss = 0.0028
Iteration 60, loss = 0.0037
Iteration 80, loss = 0.0014
--- Epoch 771 / 2000 - 771 epochs total
Iteration 0, loss = 0.0031
Iteration 20, loss = 0.0032
Iteration 40, loss = 0.0056
Iteration 60, loss = 0.0019
Iteration 80, loss = 0.0035
--- Epoch 772 / 2000 - 772 epochs total
Iteration 0, loss = 0.0020
Iteration 20, loss = 0.0048
Iteration 40, loss = 0.0028
Iteration 60, loss = 0.0035
Iteration 80, loss = 0.0034
--- Epoch 773 / 2000 - 773 epochs total
Iteration 0, loss = 0.0081
Iteration 20, loss = 0.0013
Iteration 40, loss = 0.0035
Iteration 60, loss = 0.0037
Iteration 80, loss = 0.0030
--- Epoch 774 / 2000 - 774 epochs total
Iteration 0, loss = 0.0021
Iteration 20, loss = 0.0247
Iteration 40, loss = 0.0054
Iteration 60, loss = 0.0015
Iteration 80, loss = 0.0018
--- Epoch 775 / 2000 - 775 epochs total
Iteration 0, loss = 0.0069
Iteration 20, loss = 0.0027
Iteration 40, loss = 0.0047
Iteration 60, loss = 0.0081
Iteration 80, loss = 0.0042
--- Epoch 776 / 2000 - 776 epochs total
Iteration 0, loss = 0.0023
Iteration 20, loss = 0.0039
Iteration 40, loss = 0.0080
Iteration 60, loss = 0.0044
Iteration 80, loss = 0.0077
--- Epoch 777 / 2000 - 777 epochs total
Iteration 0, loss = 0.0026
Iteration 20, loss = 0.0020
Iteration 40, loss = 0.0018
Iteration 60, loss = 0.0078
Iteration 80, loss = 0.0017
--- Epoch 778 / 2000 - 778 epochs total
Iteration 0, loss = 0.0022
Iteration 20, loss = 0.0057
Iteration 40, loss = 0.0091
Iteration 60, loss = 0.0027
Iteration 80, loss = 0.0179
--- Epoch 779 / 2000 - 779 epochs total
Iteration 0, loss = 0.0025
Iteration 20, loss = 0.0037
Iteration 40, loss = 0.0064
Iteration 60, loss = 0.0034
Iteration 80, loss = 0.0202
--- Epoch 780 / 2000 - 780 epochs total
Iteration 0, loss = 0.0044
Iteration 20, loss = 0.0042
Iteration 40, loss = 0.0017
Iteration 60, loss = 0.0218
Iteration 80, loss = 0.0078
--- Epoch 781 / 2000 - 781 epochs total
Iteration 0, loss = 0.0090
Iteration 20, loss = 0.0027
Iteration 40, loss = 0.0062
Iteration 60, loss = 0.0017
Iteration 80, loss = 0.0035
--- Epoch 782 / 2000 - 782 epochs total
Iteration 0, loss = 0.0032
Iteration 20, loss = 0.0058
Iteration 40, loss = 0.0028
Iteration 60, loss = 0.0087
Iteration 80, loss = 0.0020
--- Epoch 783 / 2000 - 783 epochs total
Iteration 0, loss = 0.0093
Iteration 20, loss = 0.0041
Iteration 40, loss = 0.0058
Iteration 60, loss = 0.0027
Iteration 80, loss = 0.0020
--- Epoch 784 / 2000 - 784 epochs total
Iteration 0, loss = 0.0032
Iteration 20, loss = 0.0020
Iteration 40, loss = 0.0049
Iteration 60, loss = 0.0021
Iteration 80, loss = 0.0042
--- Epoch 785 / 2000 - 785 epochs total
Iteration 0, loss = 0.0053
Iteration 20, loss = 0.0094
Iteration 40, loss = 0.0030
Iteration 60, loss = 0.0035
Iteration 80, loss = 0.0062
--- Epoch 786 / 2000 - 786 epochs total
Iteration 0, loss = 0.0042
Iteration 20, loss = 0.0018
Iteration 40, loss = 0.0015
Iteration 60, loss = 0.0018
Iteration 80, loss = 0.0026
--- Epoch 787 / 2000 - 787 epochs total
Iteration 0, loss = 0.0047
Iteration 20, loss = 0.0024
Iteration 40, loss = 0.0044
Iteration 60, loss = 0.0031
Iteration 80, loss = 0.0067
--- Epoch 788 / 2000 - 788 epochs total
Iteration 0, loss = 0.0015
Iteration 20, loss = 0.0050
Iteration 40, loss = 0.0032
Iteration 60, loss = 0.0039
Iteration 80, loss = 0.0080
--- Epoch 789 / 2000 - 789 epochs total
Iteration 0, loss = 0.0055
Iteration 20, loss = 0.0053
Iteration 40, loss = 0.0066
Iteration 60, loss = 0.0021
Iteration 80, loss = 0.0058
--- Epoch 790 / 2000 - 790 epochs total
Iteration 0, loss = 0.0069
Iteration 20, loss = 0.0054
Iteration 40, loss = 0.0123
Iteration 60, loss = 0.0056
Iteration 80, loss = 0.0073
--- Epoch 791 / 2000 - 791 epochs total
Iteration 0, loss = 0.0050
Iteration 20, loss = 0.0032
Iteration 40, loss = 0.0024
Iteration 60, loss = 0.0045
Iteration 80, loss = 0.0067
--- Epoch 792 / 2000 - 792 epochs total
Iteration 0, loss = 0.0016
Iteration 20, loss = 0.0011
Iteration 40, loss = 0.0074
Iteration 60, loss = 0.0037
Iteration 80, loss = 0.0074
--- Epoch 793 / 2000 - 793 epochs total
Iteration 0, loss = 0.0046
Iteration 20, loss = 0.0052
Iteration 40, loss = 0.0035
Iteration 60, loss = 0.0049
Iteration 80, loss = 0.0011
--- Epoch 794 / 2000 - 794 epochs total
Iteration 0, loss = 0.0016
Iteration 20, loss = 0.0034
Iteration 40, loss = 0.0024
Iteration 60, loss = 0.0025
Iteration 80, loss = 0.0040
--- Epoch 795 / 2000 - 795 epochs total
Iteration 0, loss = 0.0016
Iteration 20, loss = 0.0046
Iteration 40, loss = 0.0098
Iteration 60, loss = 0.0056
Iteration 80, loss = 0.0063
--- Epoch 796 / 2000 - 796 epochs total
Iteration 0, loss = 0.0013
Iteration 20, loss = 0.0045
Iteration 40, loss = 0.0031
Iteration 60, loss = 0.0018
Iteration 80, loss = 0.0186
--- Epoch 797 / 2000 - 797 epochs total
Iteration 0, loss = 0.0070
Iteration 20, loss = 0.0048
Iteration 40, loss = 0.0016
Iteration 60, loss = 0.0039
Iteration 80, loss = 0.0049
--- Epoch 798 / 2000 - 798 epochs total
Iteration 0, loss = 0.0136
Iteration 20, loss = 0.0025
Iteration 40, loss = 0.0009
Iteration 60, loss = 0.0132
Iteration 80, loss = 0.0045
--- Epoch 799 / 2000 - 799 epochs total
Iteration 0, loss = 0.0016
Iteration 20, loss = 0.0037
Iteration 40, loss = 0.0040
Iteration 60, loss = 0.0017
Iteration 80, loss = 0.0152
--- Epoch 800 / 2000 - 800 epochs total
Iteration 0, loss = 0.0049
Iteration 20, loss = 0.0073
Iteration 40, loss = 0.0055
Iteration 60, loss = 0.0031
Iteration 80, loss = 0.0033
--- Epoch 801 / 2000 - 801 epochs total
Iteration 0, loss = 0.0060
Iteration 20, loss = 0.0059
Iteration 40, loss = 0.0038
Iteration 60, loss = 0.0020
Iteration 80, loss = 0.0037
--- Epoch 802 / 2000 - 802 epochs total
Iteration 0, loss = 0.0021
Iteration 20, loss = 0.0038
Iteration 40, loss = 0.0089
Iteration 60, loss = 0.0015
Iteration 80, loss = 0.0045
--- Epoch 803 / 2000 - 803 epochs total
Iteration 0, loss = 0.0036
Iteration 20, loss = 0.0087
Iteration 40, loss = 0.0024
Iteration 60, loss = 0.0042
Iteration 80, loss = 0.0068
--- Epoch 804 / 2000 - 804 epochs total
Iteration 0, loss = 0.0095
Iteration 20, loss = 0.0039
Iteration 40, loss = 0.0013
Iteration 60, loss = 0.0129
Iteration 80, loss = 0.0071
--- Epoch 805 / 2000 - 805 epochs total
Iteration 0, loss = 0.0014
Iteration 20, loss = 0.0165
Iteration 40, loss = 0.0019
Iteration 60, loss = 0.0115
Iteration 80, loss = 0.0075
--- Epoch 806 / 2000 - 806 epochs total
Iteration 0, loss = 0.0052
Iteration 20, loss = 0.0058
Iteration 40, loss = 0.0048
Iteration 60, loss = 0.0045
Iteration 80, loss = 0.0051
--- Epoch 807 / 2000 - 807 epochs total
Iteration 0, loss = 0.0061
Iteration 20, loss = 0.0019
Iteration 40, loss = 0.0046
Iteration 60, loss = 0.0084
Iteration 80, loss = 0.0019
--- Epoch 808 / 2000 - 808 epochs total
Iteration 0, loss = 0.0041
Iteration 20, loss = 0.0045
Iteration 40, loss = 0.0019
Iteration 60, loss = 0.0037
Iteration 80, loss = 0.0122
--- Epoch 809 / 2000 - 809 epochs total
Iteration 0, loss = 0.0035
Iteration 20, loss = 0.0013
Iteration 40, loss = 0.0026
Iteration 60, loss = 0.0055
Iteration 80, loss = 0.0098
--- Epoch 810 / 2000 - 810 epochs total
Iteration 0, loss = 0.0095
Iteration 20, loss = 0.0107
Iteration 40, loss = 0.0057
Iteration 60, loss = 0.0039
Iteration 80, loss = 0.0051
--- Epoch 811 / 2000 - 811 epochs total
Iteration 0, loss = 0.0051
Iteration 20, loss = 0.0062
Iteration 40, loss = 0.0121
Iteration 60, loss = 0.0054
Iteration 80, loss = 0.0053
--- Epoch 812 / 2000 - 812 epochs total
Iteration 0, loss = 0.0088
Iteration 20, loss = 0.0026
Iteration 40, loss = 0.0017
Iteration 60, loss = 0.0114
Iteration 80, loss = 0.0071
--- Epoch 813 / 2000 - 813 epochs total
Iteration 0, loss = 0.0016
Iteration 20, loss = 0.0031
Iteration 40, loss = 0.0162
Iteration 60, loss = 0.0047
Iteration 80, loss = 0.0063
--- Epoch 814 / 2000 - 814 epochs total
Iteration 0, loss = 0.0028
Iteration 20, loss = 0.0044
Iteration 40, loss = 0.0016
Iteration 60, loss = 0.0130
Iteration 80, loss = 0.0031
--- Epoch 815 / 2000 - 815 epochs total
Iteration 0, loss = 0.0055
Iteration 20, loss = 0.0062
Iteration 40, loss = 0.0037
Iteration 60, loss = 0.0058
Iteration 80, loss = 0.0020
--- Epoch 816 / 2000 - 816 epochs total
Iteration 0, loss = 0.0027
Iteration 20, loss = 0.0045
Iteration 40, loss = 0.0030
Iteration 60, loss = 0.0028
Iteration 80, loss = 0.0062
--- Epoch 817 / 2000 - 817 epochs total
Iteration 0, loss = 0.0040
Iteration 20, loss = 0.0074
Iteration 40, loss = 0.0043
Iteration 60, loss = 0.0012
Iteration 80, loss = 0.0087
--- Epoch 818 / 2000 - 818 epochs total
Iteration 0, loss = 0.0080
Iteration 20, loss = 0.0019
Iteration 40, loss = 0.0201
Iteration 60, loss = 0.0037
Iteration 80, loss = 0.0053
--- Epoch 819 / 2000 - 819 epochs total
Iteration 0, loss = 0.0053
Iteration 20, loss = 0.0032
Iteration 40, loss = 0.0064
Iteration 60, loss = 0.0049
Iteration 80, loss = 0.0031
--- Epoch 820 / 2000 - 820 epochs total
Iteration 0, loss = 0.0071
Iteration 20, loss = 0.0026
Iteration 40, loss = 0.0048
Iteration 60, loss = 0.0010
Iteration 80, loss = 0.0031
--- Epoch 821 / 2000 - 821 epochs total
Iteration 0, loss = 0.0024
Iteration 20, loss = 0.0032
Iteration 40, loss = 0.0110
Iteration 60, loss = 0.0054
Iteration 80, loss = 0.0048
--- Epoch 822 / 2000 - 822 epochs total
Iteration 0, loss = 0.0059
Iteration 20, loss = 0.0063
Iteration 40, loss = 0.0043
Iteration 60, loss = 0.0028
Iteration 80, loss = 0.0027
--- Epoch 823 / 2000 - 823 epochs total
Iteration 0, loss = 0.0027
Iteration 20, loss = 0.0080
Iteration 40, loss = 0.0014
Iteration 60, loss = 0.0052
Iteration 80, loss = 0.0067
--- Epoch 824 / 2000 - 824 epochs total
Iteration 0, loss = 0.0077
Iteration 20, loss = 0.0037
Iteration 40, loss = 0.0088
Iteration 60, loss = 0.0021
Iteration 80, loss = 0.0047
--- Epoch 825 / 2000 - 825 epochs total
Iteration 0, loss = 0.0082
Iteration 20, loss = 0.0012
Iteration 40, loss = 0.0031
Iteration 60, loss = 0.0018
Iteration 80, loss = 0.0113
--- Epoch 826 / 2000 - 826 epochs total
Iteration 0, loss = 0.0034
Iteration 20, loss = 0.0022
Iteration 40, loss = 0.0071
Iteration 60, loss = 0.0047
Iteration 80, loss = 0.0030
--- Epoch 827 / 2000 - 827 epochs total
Iteration 0, loss = 0.0117
Iteration 20, loss = 0.0066
Iteration 40, loss = 0.0022
Iteration 60, loss = 0.0008
Iteration 80, loss = 0.0098
--- Epoch 828 / 2000 - 828 epochs total
Iteration 0, loss = 0.0015
Iteration 20, loss = 0.0149
Iteration 40, loss = 0.0602
Iteration 60, loss = 0.0051
Iteration 80, loss = 0.0048
--- Epoch 829 / 2000 - 829 epochs total
Iteration 0, loss = 0.0170
Iteration 20, loss = 0.0026
Iteration 40, loss = 0.0084
Iteration 60, loss = 0.0022
Iteration 80, loss = 0.0070
--- Epoch 830 / 2000 - 830 epochs total
Iteration 0, loss = 0.0017
Iteration 20, loss = 0.0028
Iteration 40, loss = 0.0034
Iteration 60, loss = 0.0031
Iteration 80, loss = 0.0059
--- Epoch 831 / 2000 - 831 epochs total
Iteration 0, loss = 0.0032
Iteration 20, loss = 0.0032
Iteration 40, loss = 0.0033
Iteration 60, loss = 0.0144
Iteration 80, loss = 0.0093
--- Epoch 832 / 2000 - 832 epochs total
Iteration 0, loss = 0.0022
Iteration 20, loss = 0.0020
Iteration 40, loss = 0.0026
Iteration 60, loss = 0.0052
Iteration 80, loss = 0.0113
--- Epoch 833 / 2000 - 833 epochs total
Iteration 0, loss = 0.0010
Iteration 20, loss = 0.0013
Iteration 40, loss = 0.0183
Iteration 60, loss = 0.0216
Iteration 80, loss = 0.0108
--- Epoch 834 / 2000 - 834 epochs total
Iteration 0, loss = 0.0097
Iteration 20, loss = 0.0063
Iteration 40, loss = 0.0085
Iteration 60, loss = 0.0143
Iteration 80, loss = 0.0025
--- Epoch 835 / 2000 - 835 epochs total
Iteration 0, loss = 0.0073
Iteration 20, loss = 0.0045
Iteration 40, loss = 0.0057
Iteration 60, loss = 0.0089
Iteration 80, loss = 0.0047
--- Epoch 836 / 2000 - 836 epochs total
Iteration 0, loss = 0.0036
Iteration 20, loss = 0.0068
Iteration 40, loss = 0.0102
Iteration 60, loss = 0.0031
Iteration 80, loss = 0.0045
--- Epoch 837 / 2000 - 837 epochs total
Iteration 0, loss = 0.0079
Iteration 20, loss = 0.0107
Iteration 40, loss = 0.0031
Iteration 60, loss = 0.0021
Iteration 80, loss = 0.0081
--- Epoch 838 / 2000 - 838 epochs total
Iteration 0, loss = 0.0035
Iteration 20, loss = 0.0052
Iteration 40, loss = 0.0061
Iteration 60, loss = 0.0016
Iteration 80, loss = 0.0062
--- Epoch 839 / 2000 - 839 epochs total
Iteration 0, loss = 0.0052
Iteration 20, loss = 0.0016
Iteration 40, loss = 0.0079
Iteration 60, loss = 0.0031
Iteration 80, loss = 0.0033
--- Epoch 840 / 2000 - 840 epochs total
Iteration 0, loss = 0.0125
Iteration 20, loss = 0.0015
Iteration 40, loss = 0.0048
Iteration 60, loss = 0.0076
Iteration 80, loss = 0.0020
--- Epoch 841 / 2000 - 841 epochs total
Iteration 0, loss = 0.0028
Iteration 20, loss = 0.0021
Iteration 40, loss = 0.0067
Iteration 60, loss = 0.0049
Iteration 80, loss = 0.0022
--- Epoch 842 / 2000 - 842 epochs total
Iteration 0, loss = 0.0064
Iteration 20, loss = 0.0073
Iteration 40, loss = 0.0043
Iteration 60, loss = 0.0050
Iteration 80, loss = 0.0071
--- Epoch 843 / 2000 - 843 epochs total
Iteration 0, loss = 0.0045
Iteration 20, loss = 0.0204
Iteration 40, loss = 0.0024
Iteration 60, loss = 0.0028
Iteration 80, loss = 0.0029
--- Epoch 844 / 2000 - 844 epochs total
Iteration 0, loss = 0.0081
Iteration 20, loss = 0.0028
Iteration 40, loss = 0.0039
Iteration 60, loss = 0.0044
Iteration 80, loss = 0.0028
--- Epoch 845 / 2000 - 845 epochs total
Iteration 0, loss = 0.0036
Iteration 20, loss = 0.0044
Iteration 40, loss = 0.0105
Iteration 60, loss = 0.0130
Iteration 80, loss = 0.0017
--- Epoch 846 / 2000 - 846 epochs total
Iteration 0, loss = 0.0019
Iteration 20, loss = 0.0075
Iteration 40, loss = 0.0020
Iteration 60, loss = 0.0023
Iteration 80, loss = 0.0145
--- Epoch 847 / 2000 - 847 epochs total
Iteration 0, loss = 0.0023
Iteration 20, loss = 0.0013
Iteration 40, loss = 0.0025
Iteration 60, loss = 0.0017
Iteration 80, loss = 0.0023
--- Epoch 848 / 2000 - 848 epochs total
Iteration 0, loss = 0.0015
Iteration 20, loss = 0.0013
Iteration 40, loss = 0.0041
Iteration 60, loss = 0.0053
Iteration 80, loss = 0.0032
--- Epoch 849 / 2000 - 849 epochs total
Iteration 0, loss = 0.0015
Iteration 20, loss = 0.0025
Iteration 40, loss = 0.0035
Iteration 60, loss = 0.0034
Iteration 80, loss = 0.0049
--- Epoch 850 / 2000 - 850 epochs total
Iteration 0, loss = 0.0038
Iteration 20, loss = 0.0045
Iteration 40, loss = 0.0068
Iteration 60, loss = 0.0078
Iteration 80, loss = 0.0035
--- Epoch 851 / 2000 - 851 epochs total
Iteration 0, loss = 0.0041
Iteration 20, loss = 0.0052
Iteration 40, loss = 0.0036
Iteration 60, loss = 0.0126
Iteration 80, loss = 0.0138
--- Epoch 852 / 2000 - 852 epochs total
Iteration 0, loss = 0.0019
Iteration 20, loss = 0.0058
Iteration 40, loss = 0.0017
Iteration 60, loss = 0.0065
Iteration 80, loss = 0.0054
--- Epoch 853 / 2000 - 853 epochs total
Iteration 0, loss = 0.0010
Iteration 20, loss = 0.0048
Iteration 40, loss = 0.0089
Iteration 60, loss = 0.0130
Iteration 80, loss = 0.0035
--- Epoch 854 / 2000 - 854 epochs total
Iteration 0, loss = 0.0056
Iteration 20, loss = 0.0127
Iteration 40, loss = 0.0040
Iteration 60, loss = 0.0103
Iteration 80, loss = 0.0034
--- Epoch 855 / 2000 - 855 epochs total
Iteration 0, loss = 0.0025
Iteration 20, loss = 0.0072
Iteration 40, loss = 0.0069
Iteration 60, loss = 0.0102
Iteration 80, loss = 0.0108
--- Epoch 856 / 2000 - 856 epochs total
Iteration 0, loss = 0.0103
Iteration 20, loss = 0.0074
Iteration 40, loss = 0.0051
Iteration 60, loss = 0.0013
Iteration 80, loss = 0.0036
--- Epoch 857 / 2000 - 857 epochs total
Iteration 0, loss = 0.0053
Iteration 20, loss = 0.0027
Iteration 40, loss = 0.0014
Iteration 60, loss = 0.0040
Iteration 80, loss = 0.0061
--- Epoch 858 / 2000 - 858 epochs total
Iteration 0, loss = 0.0018
Iteration 20, loss = 0.0094
Iteration 40, loss = 0.0027
Iteration 60, loss = 0.0065
Iteration 80, loss = 0.0070
--- Epoch 859 / 2000 - 859 epochs total
Iteration 0, loss = 0.0047
Iteration 20, loss = 0.0020
Iteration 40, loss = 0.0118
Iteration 60, loss = 0.0013
Iteration 80, loss = 0.0034
--- Epoch 860 / 2000 - 860 epochs total
Iteration 0, loss = 0.0044
Iteration 20, loss = 0.0094
Iteration 40, loss = 0.0067
Iteration 60, loss = 0.0122
Iteration 80, loss = 0.0018
--- Epoch 861 / 2000 - 861 epochs total
Iteration 0, loss = 0.0062
Iteration 20, loss = 0.0045
Iteration 40, loss = 0.0063
Iteration 60, loss = 0.0027
Iteration 80, loss = 0.0095
--- Epoch 862 / 2000 - 862 epochs total
Iteration 0, loss = 0.0020
Iteration 20, loss = 0.0031
Iteration 40, loss = 0.0036
Iteration 60, loss = 0.0051
Iteration 80, loss = 0.0045
--- Epoch 863 / 2000 - 863 epochs total
Iteration 0, loss = 0.0042
Iteration 20, loss = 0.0013
Iteration 40, loss = 0.0101
Iteration 60, loss = 0.0057
Iteration 80, loss = 0.0050
--- Epoch 864 / 2000 - 864 epochs total
Iteration 0, loss = 0.0026
Iteration 20, loss = 0.0043
Iteration 40, loss = 0.0120
Iteration 60, loss = 0.0056
Iteration 80, loss = 0.0048
--- Epoch 865 / 2000 - 865 epochs total
Iteration 0, loss = 0.0025
Iteration 20, loss = 0.0015
Iteration 40, loss = 0.0043
Iteration 60, loss = 0.0044
Iteration 80, loss = 0.0085
--- Epoch 866 / 2000 - 866 epochs total
Iteration 0, loss = 0.0037
Iteration 20, loss = 0.0205
Iteration 40, loss = 0.0115
Iteration 60, loss = 0.0016
Iteration 80, loss = 0.0077
--- Epoch 867 / 2000 - 867 epochs total
Iteration 0, loss = 0.0043
Iteration 20, loss = 0.0022
Iteration 40, loss = 0.0030
Iteration 60, loss = 0.0045
Iteration 80, loss = 0.0022
--- Epoch 868 / 2000 - 868 epochs total
Iteration 0, loss = 0.0022
Iteration 20, loss = 0.0016
Iteration 40, loss = 0.0051
Iteration 60, loss = 0.0204
Iteration 80, loss = 0.0031
--- Epoch 869 / 2000 - 869 epochs total
Iteration 0, loss = 0.0126
Iteration 20, loss = 0.0014
Iteration 40, loss = 0.0063
Iteration 60, loss = 0.0136
Iteration 80, loss = 0.0230
--- Epoch 870 / 2000 - 870 epochs total
Iteration 0, loss = 0.0052
Iteration 20, loss = 0.0072
Iteration 40, loss = 0.0027
Iteration 60, loss = 0.0026
Iteration 80, loss = 0.0033
--- Epoch 871 / 2000 - 871 epochs total
Iteration 0, loss = 0.0033
Iteration 20, loss = 0.0026
Iteration 40, loss = 0.0056
Iteration 60, loss = 0.0034
Iteration 80, loss = 0.0014
--- Epoch 872 / 2000 - 872 epochs total
Iteration 0, loss = 0.0062
Iteration 20, loss = 0.0054
Iteration 40, loss = 0.0015
Iteration 60, loss = 0.0019
Iteration 80, loss = 0.0011
--- Epoch 873 / 2000 - 873 epochs total
Iteration 0, loss = 0.0057
Iteration 20, loss = 0.0231
Iteration 40, loss = 0.0045
Iteration 60, loss = 0.0043
Iteration 80, loss = 0.0030
--- Epoch 874 / 2000 - 874 epochs total
Iteration 0, loss = 0.0045
Iteration 20, loss = 0.0047
Iteration 40, loss = 0.0015
Iteration 60, loss = 0.0032
Iteration 80, loss = 0.0019
--- Epoch 875 / 2000 - 875 epochs total
Iteration 0, loss = 0.0042
Iteration 20, loss = 0.0019
Iteration 40, loss = 0.0018
Iteration 60, loss = 0.0040
Iteration 80, loss = 0.0053
--- Epoch 876 / 2000 - 876 epochs total
Iteration 0, loss = 0.0048
Iteration 20, loss = 0.0064
Iteration 40, loss = 0.0068
Iteration 60, loss = 0.0042
Iteration 80, loss = 0.0020
--- Epoch 877 / 2000 - 877 epochs total
Iteration 0, loss = 0.0024
Iteration 20, loss = 0.0021
Iteration 40, loss = 0.0014
Iteration 60, loss = 0.0045
Iteration 80, loss = 0.0069
--- Epoch 878 / 2000 - 878 epochs total
Iteration 0, loss = 0.0014
Iteration 20, loss = 0.0037
Iteration 40, loss = 0.0018
Iteration 60, loss = 0.0046
Iteration 80, loss = 0.0018
--- Epoch 879 / 2000 - 879 epochs total
Iteration 0, loss = 0.0030
Iteration 20, loss = 0.0021
Iteration 40, loss = 0.0066
Iteration 60, loss = 0.0030
Iteration 80, loss = 0.0228
--- Epoch 880 / 2000 - 880 epochs total
Iteration 0, loss = 0.0025
Iteration 20, loss = 0.0038
Iteration 40, loss = 0.0163
Iteration 60, loss = 0.0046
Iteration 80, loss = 0.0016
--- Epoch 881 / 2000 - 881 epochs total
Iteration 0, loss = 0.0023
Iteration 20, loss = 0.0033
Iteration 40, loss = 0.0763
Iteration 60, loss = 0.0098
Iteration 80, loss = 0.0064
--- Epoch 882 / 2000 - 882 epochs total
Iteration 0, loss = 0.0033
Iteration 20, loss = 0.0051
Iteration 40, loss = 0.0042
Iteration 60, loss = 0.0040
Iteration 80, loss = 0.0024
--- Epoch 883 / 2000 - 883 epochs total
Iteration 0, loss = 0.0048
Iteration 20, loss = 0.0059
Iteration 40, loss = 0.0014
Iteration 60, loss = 0.0082
Iteration 80, loss = 0.0120
--- Epoch 884 / 2000 - 884 epochs total
Iteration 0, loss = 0.0045
Iteration 20, loss = 0.0084
Iteration 40, loss = 0.0058
Iteration 60, loss = 0.0028
Iteration 80, loss = 0.0083
--- Epoch 885 / 2000 - 885 epochs total
Iteration 0, loss = 0.0032
Iteration 20, loss = 0.0055
Iteration 40, loss = 0.0088
Iteration 60, loss = 0.0030
Iteration 80, loss = 0.0085
--- Epoch 886 / 2000 - 886 epochs total
Iteration 0, loss = 0.0024
Iteration 20, loss = 0.0040
Iteration 40, loss = 0.0015
Iteration 60, loss = 0.0074
Iteration 80, loss = 0.0053
--- Epoch 887 / 2000 - 887 epochs total
Iteration 0, loss = 0.0180
Iteration 20, loss = 0.0052
Iteration 40, loss = 0.0087
Iteration 60, loss = 0.0090
Iteration 80, loss = 0.0015
--- Epoch 888 / 2000 - 888 epochs total
Iteration 0, loss = 0.0265
Iteration 20, loss = 0.0022
Iteration 40, loss = 0.0044
Iteration 60, loss = 0.0016
Iteration 80, loss = 0.0082
--- Epoch 889 / 2000 - 889 epochs total
Iteration 0, loss = 0.0019
Iteration 20, loss = 0.0041
Iteration 40, loss = 0.0272
Iteration 60, loss = 0.0022
Iteration 80, loss = 0.0108
--- Epoch 890 / 2000 - 890 epochs total
Iteration 0, loss = 0.0024
Iteration 20, loss = 0.0024
Iteration 40, loss = 0.0043
Iteration 60, loss = 0.0193
Iteration 80, loss = 0.0013
--- Epoch 891 / 2000 - 891 epochs total
Iteration 0, loss = 0.0030
Iteration 20, loss = 0.0075
Iteration 40, loss = 0.0014
Iteration 60, loss = 0.0040
Iteration 80, loss = 0.0029
--- Epoch 892 / 2000 - 892 epochs total
Iteration 0, loss = 0.0050
Iteration 20, loss = 0.0178
Iteration 40, loss = 0.0026
Iteration 60, loss = 0.0024
Iteration 80, loss = 0.0042
--- Epoch 893 / 2000 - 893 epochs total
Iteration 0, loss = 0.0037
Iteration 20, loss = 0.0058
Iteration 40, loss = 0.0019
Iteration 60, loss = 0.0087
Iteration 80, loss = 0.0030
--- Epoch 894 / 2000 - 894 epochs total
Iteration 0, loss = 0.0037
Iteration 20, loss = 0.0035
Iteration 40, loss = 0.0019
Iteration 60, loss = 0.0062
Iteration 80, loss = 0.0031
--- Epoch 895 / 2000 - 895 epochs total
Iteration 0, loss = 0.0061
Iteration 20, loss = 0.0160
Iteration 40, loss = 0.0051
Iteration 60, loss = 0.0017
Iteration 80, loss = 0.0025
--- Epoch 896 / 2000 - 896 epochs total
Iteration 0, loss = 0.0023
Iteration 20, loss = 0.0026
Iteration 40, loss = 0.0102
Iteration 60, loss = 0.0036
Iteration 80, loss = 0.0044
--- Epoch 897 / 2000 - 897 epochs total
Iteration 0, loss = 0.0017
Iteration 20, loss = 0.0174
Iteration 40, loss = 0.0021
Iteration 60, loss = 0.0034
Iteration 80, loss = 0.0069
--- Epoch 898 / 2000 - 898 epochs total
Iteration 0, loss = 0.0022
Iteration 20, loss = 0.0018
Iteration 40, loss = 0.0052
Iteration 60, loss = 0.0024
Iteration 80, loss = 0.0039
--- Epoch 899 / 2000 - 899 epochs total
Iteration 0, loss = 0.0046
Iteration 20, loss = 0.0044
Iteration 40, loss = 0.0031
Iteration 60, loss = 0.0019
Iteration 80, loss = 0.0016
--- Epoch 900 / 2000 - 900 epochs total
Iteration 0, loss = 0.0074
Iteration 20, loss = 0.0036
Iteration 40, loss = 0.0026
Iteration 60, loss = 0.0090
Iteration 80, loss = 0.0035
--- Epoch 901 / 2000 - 901 epochs total
Iteration 0, loss = 0.0088
Iteration 20, loss = 0.0012
Iteration 40, loss = 0.0024
Iteration 60, loss = 0.0106
Iteration 80, loss = 0.0014
--- Epoch 902 / 2000 - 902 epochs total
Iteration 0, loss = 0.0028
Iteration 20, loss = 0.0019
Iteration 40, loss = 0.0050
Iteration 60, loss = 0.0047
Iteration 80, loss = 0.0049
--- Epoch 903 / 2000 - 903 epochs total
Iteration 0, loss = 0.0049
Iteration 20, loss = 0.0032
Iteration 40, loss = 0.0122
Iteration 60, loss = 0.0018
Iteration 80, loss = 0.0041
--- Epoch 904 / 2000 - 904 epochs total
Iteration 0, loss = 0.0245
Iteration 20, loss = 0.0039
Iteration 40, loss = 0.0249
Iteration 60, loss = 0.0046
Iteration 80, loss = 0.0033
--- Epoch 905 / 2000 - 905 epochs total
Iteration 0, loss = 0.0182
Iteration 20, loss = 0.0050
Iteration 40, loss = 0.0034
Iteration 60, loss = 0.0094
Iteration 80, loss = 0.0156
--- Epoch 906 / 2000 - 906 epochs total
Iteration 0, loss = 0.0077
Iteration 20, loss = 0.0059
Iteration 40, loss = 0.0020
Iteration 60, loss = 0.0065
Iteration 80, loss = 0.0033
--- Epoch 907 / 2000 - 907 epochs total
Iteration 0, loss = 0.0113
Iteration 20, loss = 0.0058
Iteration 40, loss = 0.0034
Iteration 60, loss = 0.0060
Iteration 80, loss = 0.0021
--- Epoch 908 / 2000 - 908 epochs total
Iteration 0, loss = 0.0105
Iteration 20, loss = 0.0017
Iteration 40, loss = 0.0153
Iteration 60, loss = 0.0013
Iteration 80, loss = 0.0020
--- Epoch 909 / 2000 - 909 epochs total
Iteration 0, loss = 0.0057
Iteration 20, loss = 0.0053
Iteration 40, loss = 0.0143
Iteration 60, loss = 0.0064
Iteration 80, loss = 0.0018
--- Epoch 910 / 2000 - 910 epochs total
Iteration 0, loss = 0.0009
Iteration 20, loss = 0.0095
Iteration 40, loss = 0.0057
Iteration 60, loss = 0.0019
Iteration 80, loss = 0.0017
--- Epoch 911 / 2000 - 911 epochs total
Iteration 0, loss = 0.0027
Iteration 20, loss = 0.0022
Iteration 40, loss = 0.0046
Iteration 60, loss = 0.0018
Iteration 80, loss = 0.0039
--- Epoch 912 / 2000 - 912 epochs total
Iteration 0, loss = 0.0041
Iteration 20, loss = 0.0087
Iteration 40, loss = 0.0028
Iteration 60, loss = 0.0023
Iteration 80, loss = 0.0042
--- Epoch 913 / 2000 - 913 epochs total
Iteration 0, loss = 0.0043
Iteration 20, loss = 0.0026
Iteration 40, loss = 0.0213
Iteration 60, loss = 0.0029
Iteration 80, loss = 0.0032
--- Epoch 914 / 2000 - 914 epochs total
Iteration 0, loss = 0.0013
Iteration 20, loss = 0.0042
Iteration 40, loss = 0.0036
Iteration 60, loss = 0.0044
Iteration 80, loss = 0.0060
--- Epoch 915 / 2000 - 915 epochs total
Iteration 0, loss = 0.0086
Iteration 20, loss = 0.0061
Iteration 40, loss = 0.0027
Iteration 60, loss = 0.0048
Iteration 80, loss = 0.0037
--- Epoch 916 / 2000 - 916 epochs total
Iteration 0, loss = 0.0072
Iteration 20, loss = 0.0032
Iteration 40, loss = 0.0031
Iteration 60, loss = 0.0013
Iteration 80, loss = 0.0057
--- Epoch 917 / 2000 - 917 epochs total
Iteration 0, loss = 0.0065
Iteration 20, loss = 0.0159
Iteration 40, loss = 0.0021
Iteration 60, loss = 0.0026
Iteration 80, loss = 0.0036
--- Epoch 918 / 2000 - 918 epochs total
Iteration 0, loss = 0.0067
Iteration 20, loss = 0.0032
Iteration 40, loss = 0.0063
Iteration 60, loss = 0.0047
Iteration 80, loss = 0.0124
--- Epoch 919 / 2000 - 919 epochs total
Iteration 0, loss = 0.0102
Iteration 20, loss = 0.0067
Iteration 40, loss = 0.0026
Iteration 60, loss = 0.0183
Iteration 80, loss = 0.0018
--- Epoch 920 / 2000 - 920 epochs total
Iteration 0, loss = 0.0058
Iteration 20, loss = 0.0046
Iteration 40, loss = 0.0019
Iteration 60, loss = 0.0088
Iteration 80, loss = 0.0029
--- Epoch 921 / 2000 - 921 epochs total
Iteration 0, loss = 0.0064
Iteration 20, loss = 0.0100
Iteration 40, loss = 0.0055
Iteration 60, loss = 0.0050
Iteration 80, loss = 0.0066
--- Epoch 922 / 2000 - 922 epochs total
Iteration 0, loss = 0.0024
Iteration 20, loss = 0.0060
Iteration 40, loss = 0.0040
Iteration 60, loss = 0.0105
Iteration 80, loss = 0.0018
--- Epoch 923 / 2000 - 923 epochs total
Iteration 0, loss = 0.0036
Iteration 20, loss = 0.0028
Iteration 40, loss = 0.0129
Iteration 60, loss = 0.0054
Iteration 80, loss = 0.0012
--- Epoch 924 / 2000 - 924 epochs total
Iteration 0, loss = 0.0044
Iteration 20, loss = 0.0041
Iteration 40, loss = 0.0034
Iteration 60, loss = 0.0023
Iteration 80, loss = 0.0102
--- Epoch 925 / 2000 - 925 epochs total
Iteration 0, loss = 0.0069
Iteration 20, loss = 0.0023
Iteration 40, loss = 0.0068
Iteration 60, loss = 0.0044
Iteration 80, loss = 0.0040
--- Epoch 926 / 2000 - 926 epochs total
Iteration 0, loss = 0.0016
Iteration 20, loss = 0.0038
Iteration 40, loss = 0.0045
Iteration 60, loss = 0.0046
Iteration 80, loss = 0.0050
--- Epoch 927 / 2000 - 927 epochs total
Iteration 0, loss = 0.0029
Iteration 20, loss = 0.0037
Iteration 40, loss = 0.0080
Iteration 60, loss = 0.0032
Iteration 80, loss = 0.0100
--- Epoch 928 / 2000 - 928 epochs total
Iteration 0, loss = 0.0039
Iteration 20, loss = 0.0030
Iteration 40, loss = 0.0044
Iteration 60, loss = 0.0021
Iteration 80, loss = 0.0035
--- Epoch 929 / 2000 - 929 epochs total
Iteration 0, loss = 0.0017
Iteration 20, loss = 0.0080
Iteration 40, loss = 0.0030
Iteration 60, loss = 0.0036
Iteration 80, loss = 0.0031
--- Epoch 930 / 2000 - 930 epochs total
Iteration 0, loss = 0.0026
Iteration 20, loss = 0.0015
Iteration 40, loss = 0.0046
Iteration 60, loss = 0.0009
Iteration 80, loss = 0.0015
--- Epoch 931 / 2000 - 931 epochs total
Iteration 0, loss = 0.0079
Iteration 20, loss = 0.0050
Iteration 40, loss = 0.0017
Iteration 60, loss = 0.0039
Iteration 80, loss = 0.0091
--- Epoch 932 / 2000 - 932 epochs total
Iteration 0, loss = 0.0076
Iteration 20, loss = 0.0042
Iteration 40, loss = 0.0020
Iteration 60, loss = 0.0032
Iteration 80, loss = 0.0024
--- Epoch 933 / 2000 - 933 epochs total
Iteration 0, loss = 0.0201
Iteration 20, loss = 0.0016
Iteration 40, loss = 0.0030
Iteration 60, loss = 0.0054
Iteration 80, loss = 0.0039
--- Epoch 934 / 2000 - 934 epochs total
Iteration 0, loss = 0.0030
Iteration 20, loss = 0.0031
Iteration 40, loss = 0.0016
Iteration 60, loss = 0.0078
Iteration 80, loss = 0.0131
--- Epoch 935 / 2000 - 935 epochs total
Iteration 0, loss = 0.0017
Iteration 20, loss = 0.0027
Iteration 40, loss = 0.0037
Iteration 60, loss = 0.0019
Iteration 80, loss = 0.0023
--- Epoch 936 / 2000 - 936 epochs total
Iteration 0, loss = 0.0059
Iteration 20, loss = 0.0056
Iteration 40, loss = 0.0027
Iteration 60, loss = 0.0032
Iteration 80, loss = 0.0031
--- Epoch 937 / 2000 - 937 epochs total
Iteration 0, loss = 0.0178
Iteration 20, loss = 0.0038
Iteration 40, loss = 0.0045
Iteration 60, loss = 0.0052
Iteration 80, loss = 0.0095
--- Epoch 938 / 2000 - 938 epochs total
Iteration 0, loss = 0.0057
Iteration 20, loss = 0.0019
Iteration 40, loss = 0.0129
Iteration 60, loss = 0.0075
Iteration 80, loss = 0.0028
--- Epoch 939 / 2000 - 939 epochs total
Iteration 0, loss = 0.0051
Iteration 20, loss = 0.0037
Iteration 40, loss = 0.0022
Iteration 60, loss = 0.0028
Iteration 80, loss = 0.0016
--- Epoch 940 / 2000 - 940 epochs total
Iteration 0, loss = 0.0186
Iteration 20, loss = 0.0025
Iteration 40, loss = 0.0140
Iteration 60, loss = 0.0058
Iteration 80, loss = 0.0013
--- Epoch 941 / 2000 - 941 epochs total
Iteration 0, loss = 0.0025
Iteration 20, loss = 0.0026
Iteration 40, loss = 0.0025
Iteration 60, loss = 0.0031
Iteration 80, loss = 0.0049
--- Epoch 942 / 2000 - 942 epochs total
Iteration 0, loss = 0.0102
Iteration 20, loss = 0.0030
Iteration 40, loss = 0.0069
Iteration 60, loss = 0.0035
Iteration 80, loss = 0.0024
--- Epoch 943 / 2000 - 943 epochs total
Iteration 0, loss = 0.0021
Iteration 20, loss = 0.0073
Iteration 40, loss = 0.0019
Iteration 60, loss = 0.0100
Iteration 80, loss = 0.0085
--- Epoch 944 / 2000 - 944 epochs total
Iteration 0, loss = 0.0035
Iteration 20, loss = 0.0052
Iteration 40, loss = 0.0189
Iteration 60, loss = 0.0325
Iteration 80, loss = 0.0051
--- Epoch 945 / 2000 - 945 epochs total
Iteration 0, loss = 0.0035
Iteration 20, loss = 0.0068
Iteration 40, loss = 0.0050
Iteration 60, loss = 0.0047
Iteration 80, loss = 0.0053
--- Epoch 946 / 2000 - 946 epochs total
Iteration 0, loss = 0.0025
Iteration 20, loss = 0.0080
Iteration 40, loss = 0.0059
Iteration 60, loss = 0.0231
Iteration 80, loss = 0.0047
--- Epoch 947 / 2000 - 947 epochs total
Iteration 0, loss = 0.0024
Iteration 20, loss = 0.0056
Iteration 40, loss = 0.0032
Iteration 60, loss = 0.0050
Iteration 80, loss = 0.0164
--- Epoch 948 / 2000 - 948 epochs total
Iteration 0, loss = 0.0017
Iteration 20, loss = 0.0044
Iteration 40, loss = 0.0103
Iteration 60, loss = 0.0046
Iteration 80, loss = 0.0012
--- Epoch 949 / 2000 - 949 epochs total
Iteration 0, loss = 0.0020
Iteration 20, loss = 0.0082
Iteration 40, loss = 0.0048
Iteration 60, loss = 0.0032
Iteration 80, loss = 0.0041
--- Epoch 950 / 2000 - 950 epochs total
Iteration 0, loss = 0.0057
Iteration 20, loss = 0.0063
Iteration 40, loss = 0.0072
Iteration 60, loss = 0.0016
Iteration 80, loss = 0.0041
--- Epoch 951 / 2000 - 951 epochs total
Iteration 0, loss = 0.0026
Iteration 20, loss = 0.0103
Iteration 40, loss = 0.0028
Iteration 60, loss = 0.0028
Iteration 80, loss = 0.0029
--- Epoch 952 / 2000 - 952 epochs total
Iteration 0, loss = 0.0045
Iteration 20, loss = 0.0035
Iteration 40, loss = 0.0035
Iteration 60, loss = 0.0015
Iteration 80, loss = 0.0190
--- Epoch 953 / 2000 - 953 epochs total
Iteration 0, loss = 0.0023
Iteration 20, loss = 0.0043
Iteration 40, loss = 0.0046
Iteration 60, loss = 0.0050
Iteration 80, loss = 0.0091
--- Epoch 954 / 2000 - 954 epochs total
Iteration 0, loss = 0.0021
Iteration 20, loss = 0.0013
Iteration 40, loss = 0.0020
Iteration 60, loss = 0.0063
Iteration 80, loss = 0.0033
--- Epoch 955 / 2000 - 955 epochs total
Iteration 0, loss = 0.0029
Iteration 20, loss = 0.0024
Iteration 40, loss = 0.0044
Iteration 60, loss = 0.0082
Iteration 80, loss = 0.0008
--- Epoch 956 / 2000 - 956 epochs total
Iteration 0, loss = 0.0310
Iteration 20, loss = 0.0093
Iteration 40, loss = 0.0016
Iteration 60, loss = 0.0035
Iteration 80, loss = 0.0037
--- Epoch 957 / 2000 - 957 epochs total
Iteration 0, loss = 0.0023
Iteration 20, loss = 0.0053
Iteration 40, loss = 0.0030
Iteration 60, loss = 0.0023
Iteration 80, loss = 0.0033
--- Epoch 958 / 2000 - 958 epochs total
Iteration 0, loss = 0.0038
Iteration 20, loss = 0.0093
Iteration 40, loss = 0.0073
Iteration 60, loss = 0.0069
Iteration 80, loss = 0.0050
--- Epoch 959 / 2000 - 959 epochs total
Iteration 0, loss = 0.0061
Iteration 20, loss = 0.0036
Iteration 40, loss = 0.0027
Iteration 60, loss = 0.0053
Iteration 80, loss = 0.0059
--- Epoch 960 / 2000 - 960 epochs total
Iteration 0, loss = 0.0016
Iteration 20, loss = 0.0137
Iteration 40, loss = 0.0089
Iteration 60, loss = 0.0038
Iteration 80, loss = 0.0029
--- Epoch 961 / 2000 - 961 epochs total
Iteration 0, loss = 0.0024
Iteration 20, loss = 0.0042
Iteration 40, loss = 0.0175
Iteration 60, loss = 0.0017
Iteration 80, loss = 0.0015
--- Epoch 962 / 2000 - 962 epochs total
Iteration 0, loss = 0.0016
Iteration 20, loss = 0.0036
Iteration 40, loss = 0.0064
Iteration 60, loss = 0.0030
Iteration 80, loss = 0.0021
--- Epoch 963 / 2000 - 963 epochs total
Iteration 0, loss = 0.0024
Iteration 20, loss = 0.0031
Iteration 40, loss = 0.0135
Iteration 60, loss = 0.0149
Iteration 80, loss = 0.0035
--- Epoch 964 / 2000 - 964 epochs total
Iteration 0, loss = 0.0058
Iteration 20, loss = 0.0016
Iteration 40, loss = 0.0118
Iteration 60, loss = 0.0029
Iteration 80, loss = 0.0019
--- Epoch 965 / 2000 - 965 epochs total
Iteration 0, loss = 0.0069
Iteration 20, loss = 0.0035
Iteration 40, loss = 0.0019
Iteration 60, loss = 0.0034
Iteration 80, loss = 0.0028
--- Epoch 966 / 2000 - 966 epochs total
Iteration 0, loss = 0.0016
Iteration 20, loss = 0.0031
Iteration 40, loss = 0.0018
Iteration 60, loss = 0.0017
Iteration 80, loss = 0.0071
--- Epoch 967 / 2000 - 967 epochs total
Iteration 0, loss = 0.0023
Iteration 20, loss = 0.0015
Iteration 40, loss = 0.0078
Iteration 60, loss = 0.0024
Iteration 80, loss = 0.0022
--- Epoch 968 / 2000 - 968 epochs total
Iteration 0, loss = 0.0125
Iteration 20, loss = 0.0042
Iteration 40, loss = 0.0045
Iteration 60, loss = 0.0040
Iteration 80, loss = 0.0013
--- Epoch 969 / 2000 - 969 epochs total
Iteration 0, loss = 0.0073
Iteration 20, loss = 0.0042
Iteration 40, loss = 0.0034
Iteration 60, loss = 0.0029
Iteration 80, loss = 0.0021
--- Epoch 970 / 2000 - 970 epochs total
Iteration 0, loss = 0.0122
Iteration 20, loss = 0.0017
Iteration 40, loss = 0.0233
Iteration 60, loss = 0.0026
Iteration 80, loss = 0.0037
--- Epoch 971 / 2000 - 971 epochs total
Iteration 0, loss = 0.0038
Iteration 20, loss = 0.0012
Iteration 40, loss = 0.0027
Iteration 60, loss = 0.0021
Iteration 80, loss = 0.0020
--- Epoch 972 / 2000 - 972 epochs total
Iteration 0, loss = 0.0073
Iteration 20, loss = 0.0015
Iteration 40, loss = 0.0047
Iteration 60, loss = 0.0081
Iteration 80, loss = 0.0033
--- Epoch 973 / 2000 - 973 epochs total
Iteration 0, loss = 0.0077
Iteration 20, loss = 0.0066
Iteration 40, loss = 0.0063
Iteration 60, loss = 0.0044
Iteration 80, loss = 0.0077
--- Epoch 974 / 2000 - 974 epochs total
Iteration 0, loss = 0.0054
Iteration 20, loss = 0.0287
Iteration 40, loss = 0.0039
Iteration 60, loss = 0.0068
Iteration 80, loss = 0.0027
--- Epoch 975 / 2000 - 975 epochs total
Iteration 0, loss = 0.0026
Iteration 20, loss = 0.0064
Iteration 40, loss = 0.0194
Iteration 60, loss = 0.0104
Iteration 80, loss = 0.0153
--- Epoch 976 / 2000 - 976 epochs total
Iteration 0, loss = 0.0042
Iteration 20, loss = 0.0050
Iteration 40, loss = 0.0067
Iteration 60, loss = 0.0037
Iteration 80, loss = 0.0026
--- Epoch 977 / 2000 - 977 epochs total
Iteration 0, loss = 0.0021
Iteration 20, loss = 0.0038
Iteration 40, loss = 0.0091
Iteration 60, loss = 0.0064
Iteration 80, loss = 0.0063
--- Epoch 978 / 2000 - 978 epochs total
Iteration 0, loss = 0.0035
Iteration 20, loss = 0.0087
Iteration 40, loss = 0.0018
Iteration 60, loss = 0.0034
Iteration 80, loss = 0.0298
--- Epoch 979 / 2000 - 979 epochs total
Iteration 0, loss = 0.0098
Iteration 20, loss = 0.0042
Iteration 40, loss = 0.0072
Iteration 60, loss = 0.0032
Iteration 80, loss = 0.0090
--- Epoch 980 / 2000 - 980 epochs total
Iteration 0, loss = 0.0133
Iteration 20, loss = 0.0029
Iteration 40, loss = 0.0233
Iteration 60, loss = 0.0049
Iteration 80, loss = 0.0028
--- Epoch 981 / 2000 - 981 epochs total
Iteration 0, loss = 0.0147
Iteration 20, loss = 0.0013
Iteration 40, loss = 0.0026
Iteration 60, loss = 0.0082
Iteration 80, loss = 0.0014
--- Epoch 982 / 2000 - 982 epochs total
Iteration 0, loss = 0.0075
Iteration 20, loss = 0.0056
Iteration 40, loss = 0.0060
Iteration 60, loss = 0.0021
Iteration 80, loss = 0.0051
--- Epoch 983 / 2000 - 983 epochs total
Iteration 0, loss = 0.0046
Iteration 20, loss = 0.0043
Iteration 40, loss = 0.0045
Iteration 60, loss = 0.0078
Iteration 80, loss = 0.0012
--- Epoch 984 / 2000 - 984 epochs total
Iteration 0, loss = 0.0018
Iteration 20, loss = 0.0134
Iteration 40, loss = 0.0017
Iteration 60, loss = 0.0022
Iteration 80, loss = 0.0014
--- Epoch 985 / 2000 - 985 epochs total
Iteration 0, loss = 0.0029
Iteration 20, loss = 0.0226
Iteration 40, loss = 0.0113
Iteration 60, loss = 0.0033
Iteration 80, loss = 0.0027
--- Epoch 986 / 2000 - 986 epochs total
Iteration 0, loss = 0.0037
Iteration 20, loss = 0.0095
Iteration 40, loss = 0.0023
Iteration 60, loss = 0.0080
Iteration 80, loss = 0.0013
--- Epoch 987 / 2000 - 987 epochs total
Iteration 0, loss = 0.0034
Iteration 20, loss = 0.0023
Iteration 40, loss = 0.0067
Iteration 60, loss = 0.0071
Iteration 80, loss = 0.0051
--- Epoch 988 / 2000 - 988 epochs total
Iteration 0, loss = 0.0035
Iteration 20, loss = 0.0049
Iteration 40, loss = 0.0012
Iteration 60, loss = 0.0020
Iteration 80, loss = 0.0087
--- Epoch 989 / 2000 - 989 epochs total
Iteration 0, loss = 0.0019
Iteration 20, loss = 0.0022
Iteration 40, loss = 0.0086
Iteration 60, loss = 0.0021
Iteration 80, loss = 0.0020
--- Epoch 990 / 2000 - 990 epochs total
Iteration 0, loss = 0.0060
Iteration 20, loss = 0.0092
Iteration 40, loss = 0.0031
Iteration 60, loss = 0.0059
Iteration 80, loss = 0.0053
--- Epoch 991 / 2000 - 991 epochs total
Iteration 0, loss = 0.0039
Iteration 20, loss = 0.0042
Iteration 40, loss = 0.0019
Iteration 60, loss = 0.0075
Iteration 80, loss = 0.0182
--- Epoch 992 / 2000 - 992 epochs total
Iteration 0, loss = 0.0038
Iteration 20, loss = 0.0054
Iteration 40, loss = 0.0062
Iteration 60, loss = 0.0016
Iteration 80, loss = 0.0027
--- Epoch 993 / 2000 - 993 epochs total
Iteration 0, loss = 0.0032
Iteration 20, loss = 0.0016
Iteration 40, loss = 0.0067
Iteration 60, loss = 0.0021
Iteration 80, loss = 0.0017
--- Epoch 994 / 2000 - 994 epochs total
Iteration 0, loss = 0.0016
Iteration 20, loss = 0.0018
Iteration 40, loss = 0.0250
Iteration 60, loss = 0.0080
Iteration 80, loss = 0.0019
--- Epoch 995 / 2000 - 995 epochs total
Iteration 0, loss = 0.0033
Iteration 20, loss = 0.0016
Iteration 40, loss = 0.0044
Iteration 60, loss = 0.0040
Iteration 80, loss = 0.0012
--- Epoch 996 / 2000 - 996 epochs total
Iteration 0, loss = 0.0029
Iteration 20, loss = 0.0019
Iteration 40, loss = 0.0028
Iteration 60, loss = 0.0072
Iteration 80, loss = 0.0044
--- Epoch 997 / 2000 - 997 epochs total
Iteration 0, loss = 0.0014
Iteration 20, loss = 0.0201
Iteration 40, loss = 0.0029
Iteration 60, loss = 0.0105
Iteration 80, loss = 0.0054
--- Epoch 998 / 2000 - 998 epochs total
Iteration 0, loss = 0.0018
Iteration 20, loss = 0.0031
Iteration 40, loss = 0.0018
Iteration 60, loss = 0.0045
Iteration 80, loss = 0.0032
--- Epoch 999 / 2000 - 999 epochs total
Iteration 0, loss = 0.0073
Iteration 20, loss = 0.0041
Iteration 40, loss = 0.0026
Iteration 60, loss = 0.0024
Iteration 80, loss = 0.0098
--- Epoch 1000 / 2000 - 1000 epochs total
Iteration 0, loss = 0.0042
Iteration 20, loss = 0.0021
Iteration 40, loss = 0.0016
Iteration 60, loss = 0.0023
Iteration 80, loss = 0.0112
--- Epoch 1001 / 2000 - 1001 epochs total
Iteration 0, loss = 0.0215
Iteration 20, loss = 0.0017
---------------------------------------------------------------------------
KeyboardInterrupt                         Traceback (most recent call last)
<ipython-input-117-e83bcd8f9b5f> in <module>
----> 1 train(model9, optimizer, epochs=2000, x_train=data["X_train_ship"],  y_train=data["y_train_ship"], criterion=nn.MSELoss())

<ipython-input-18-95dee9c67ab2> in train(model, optimizer, epochs, x_train, y_train, criterion)
     28             y = y_batch[t].to(device=device, dtype=dtype)
     29 
---> 30             scores = model(x)
     31 
     32             loss = criterion(scores.view(-1), y.view(-1))

/opt/anaconda3/envs/cs682/lib/python3.6/site-packages/torch/nn/modules/module.py in _call_impl(self, *input, **kwargs)
    720             result = self._slow_forward(*input, **kwargs)
    721         else:
--> 722             result = self.forward(*input, **kwargs)
    723         for hook in itertools.chain(
    724                 _global_forward_hooks.values(),

<ipython-input-24-48b049d402e0> in forward(self, x)
     25 
     26         # Encoder
---> 27         scores = F.relu(self.batchnorm1(self.conv1(x)))
     28         scores = F.relu(self.batchnorm2(self.conv2(scores)))
     29         scores = F.relu(self.batchnorm3(self.conv3(scores)))

/opt/anaconda3/envs/cs682/lib/python3.6/site-packages/torch/nn/modules/module.py in _call_impl(self, *input, **kwargs)
    720             result = self._slow_forward(*input, **kwargs)
    721         else:
--> 722             result = self.forward(*input, **kwargs)
    723         for hook in itertools.chain(
    724                 _global_forward_hooks.values(),

/opt/anaconda3/envs/cs682/lib/python3.6/site-packages/torch/nn/modules/conv.py in forward(self, input)
    417 
    418     def forward(self, input: Tensor) -> Tensor:
--> 419         return self._conv_forward(input, self.weight)
    420 
    421 class Conv3d(_ConvNd):

/opt/anaconda3/envs/cs682/lib/python3.6/site-packages/torch/nn/modules/conv.py in _conv_forward(self, input, weight)
    414                             _pair(0), self.dilation, self.groups)
    415         return F.conv2d(input, weight, self.bias, self.stride,
--> 416                         self.padding, self.dilation, self.groups)
    417 
    418     def forward(self, input: Tensor) -> Tensor:

KeyboardInterrupt: 
In [120]:
# Evaluate model9 on the held-out "ship" arrays, using the same MSE criterion
# that the training call for this model was given.
testModel(
    model9,
    x_test=data["X_test_ship"],
    y_test=data["y_test_ship"],
    criterion=nn.MSELoss(),
)
In [47]:
# model11: a freshly initialised ConvNet4, optimised with plain SGD (step size 1e-2).
# NOTE: `learning_rate` and `optimizer` are notebook-wide names that other
# model-setup cells rebind as well, so they only describe model11 until the next
# setup cell is executed.
model11 = ConvNet4()
learning_rate = 1e-2
optimizer = optim.SGD(
    model11.parameters(),
    lr=learning_rate,
)
In [130]:
# Train model11 on the `X_train_frog` / `y_train_frog` arrays with an MSE objective.
#
# The optimizer is (re)built from model11's own parameters right here instead of
# relying on whatever the global `optimizer` currently points at. Every model-setup
# cell in this notebook assigns to that same global name, and the execution counts
# show that the model12 setup (In [52]) ran after the model11 setup (In [47]) and
# before this cell (In [130]). An optimizer created for another model only holds
# that model's parameters, so handing it to train() would not update model11
# (presumably train() just calls optimizer.step() -- its full body is not shown here).
#
# SGD is configured without momentum, so it keeps no per-parameter state and
# recreating it is equivalent to reusing a correctly bound instance.
# `learning_rate` is the notebook-wide value set by the setup cells (1e-2).
optimizer = optim.SGD(model11.parameters(), lr=learning_rate)
train(
    model11,
    optimizer,
    epochs=419,
    x_train=data["X_train_frog"],
    y_train=data["y_train_frog"],
    criterion=nn.MSELoss(),
)
--- Epoch 1 / 419 - 2582 epochs total
Iteration 0, loss = 0.0035
Iteration 20, loss = 0.0050
Iteration 40, loss = 0.0089
Iteration 60, loss = 0.0039
Iteration 80, loss = 0.0044
--- Epoch 2 / 419 - 2583 epochs total
Iteration 0, loss = 0.0051
Iteration 20, loss = 0.0023
Iteration 40, loss = 0.0068
Iteration 60, loss = 0.0017
Iteration 80, loss = 0.0045
--- Epoch 3 / 419 - 2584 epochs total
Iteration 0, loss = 0.0016
Iteration 20, loss = 0.0024
Iteration 40, loss = 0.0044
Iteration 60, loss = 0.0061
Iteration 80, loss = 0.0018
--- Epoch 4 / 419 - 2585 epochs total
Iteration 0, loss = 0.0027
Iteration 20, loss = 0.0024
Iteration 40, loss = 0.0033
Iteration 60, loss = 0.0158
Iteration 80, loss = 0.0029
--- Epoch 5 / 419 - 2586 epochs total
Iteration 0, loss = 0.0046
Iteration 20, loss = 0.0022
Iteration 40, loss = 0.0053
Iteration 60, loss = 0.0011
Iteration 80, loss = 0.0019
--- Epoch 6 / 419 - 2587 epochs total
Iteration 0, loss = 0.0025
Iteration 20, loss = 0.0038
Iteration 40, loss = 0.0023
Iteration 60, loss = 0.0045
Iteration 80, loss = 0.0066
--- Epoch 7 / 419 - 2588 epochs total
Iteration 0, loss = 0.0029
Iteration 20, loss = 0.0041
Iteration 40, loss = 0.0036
Iteration 60, loss = 0.0015
Iteration 80, loss = 0.0035
--- Epoch 8 / 419 - 2589 epochs total
Iteration 0, loss = 0.0009
Iteration 20, loss = 0.0035
Iteration 40, loss = 0.0028
Iteration 60, loss = 0.0060
Iteration 80, loss = 0.0025
--- Epoch 9 / 419 - 2590 epochs total
Iteration 0, loss = 0.0105
Iteration 20, loss = 0.0036
Iteration 40, loss = 0.0013
Iteration 60, loss = 0.0059
Iteration 80, loss = 0.0027
--- Epoch 10 / 419 - 2591 epochs total
Iteration 0, loss = 0.0012
Iteration 20, loss = 0.0057
Iteration 40, loss = 0.0031
Iteration 60, loss = 0.0055
Iteration 80, loss = 0.0013
--- Epoch 11 / 419 - 2592 epochs total
Iteration 0, loss = 0.0071
Iteration 20, loss = 0.0028
Iteration 40, loss = 0.0039
Iteration 60, loss = 0.0023
Iteration 80, loss = 0.0020
--- Epoch 12 / 419 - 2593 epochs total
Iteration 0, loss = 0.0020
Iteration 20, loss = 0.0036
Iteration 40, loss = 0.0019
Iteration 60, loss = 0.0025
Iteration 80, loss = 0.0032
--- Epoch 13 / 419 - 2594 epochs total
Iteration 0, loss = 0.0028
Iteration 20, loss = 0.0055
Iteration 40, loss = 0.0027
Iteration 60, loss = 0.0040
Iteration 80, loss = 0.0065
--- Epoch 14 / 419 - 2595 epochs total
Iteration 0, loss = 0.0043
Iteration 20, loss = 0.0020
Iteration 40, loss = 0.0032
Iteration 60, loss = 0.0055
Iteration 80, loss = 0.0040
--- Epoch 15 / 419 - 2596 epochs total
Iteration 0, loss = 0.0019
Iteration 20, loss = 0.0046
Iteration 40, loss = 0.0076
Iteration 60, loss = 0.0024
Iteration 80, loss = 0.0019
--- Epoch 16 / 419 - 2597 epochs total
Iteration 0, loss = 0.0025
Iteration 20, loss = 0.0041
Iteration 40, loss = 0.0024
Iteration 60, loss = 0.0057
Iteration 80, loss = 0.0033
--- Epoch 17 / 419 - 2598 epochs total
Iteration 0, loss = 0.0017
Iteration 20, loss = 0.0017
Iteration 40, loss = 0.0048
Iteration 60, loss = 0.0021
Iteration 80, loss = 0.0070
--- Epoch 18 / 419 - 2599 epochs total
Iteration 0, loss = 0.0026
Iteration 20, loss = 0.0101
Iteration 40, loss = 0.0024
Iteration 60, loss = 0.0038
Iteration 80, loss = 0.0041
--- Epoch 19 / 419 - 2600 epochs total
Iteration 0, loss = 0.0050
Iteration 20, loss = 0.0147
Iteration 40, loss = 0.0016
Iteration 60, loss = 0.0019
Iteration 80, loss = 0.0026
--- Epoch 20 / 419 - 2601 epochs total
Iteration 0, loss = 0.0134
Iteration 20, loss = 0.0036
Iteration 40, loss = 0.0020
Iteration 60, loss = 0.0054
Iteration 80, loss = 0.0023
--- Epoch 21 / 419 - 2602 epochs total
Iteration 0, loss = 0.0033
Iteration 20, loss = 0.0039
Iteration 40, loss = 0.0028
Iteration 60, loss = 0.0032
Iteration 80, loss = 0.0067
--- Epoch 22 / 419 - 2603 epochs total
Iteration 0, loss = 0.0012
Iteration 20, loss = 0.0021
Iteration 40, loss = 0.0022
Iteration 60, loss = 0.0031
Iteration 80, loss = 0.0070
--- Epoch 23 / 419 - 2604 epochs total
Iteration 0, loss = 0.0033
Iteration 20, loss = 0.0208
Iteration 40, loss = 0.0044
Iteration 60, loss = 0.0027
Iteration 80, loss = 0.0016
--- Epoch 24 / 419 - 2605 epochs total
Iteration 0, loss = 0.0030
Iteration 20, loss = 0.0030
Iteration 40, loss = 0.0068
Iteration 60, loss = 0.0017
Iteration 80, loss = 0.0038
--- Epoch 25 / 419 - 2606 epochs total
Iteration 0, loss = 0.0026
Iteration 20, loss = 0.0033
Iteration 40, loss = 0.0030
Iteration 60, loss = 0.0039
Iteration 80, loss = 0.0044
--- Epoch 26 / 419 - 2607 epochs total
Iteration 0, loss = 0.0092
Iteration 20, loss = 0.0028
Iteration 40, loss = 0.0039
Iteration 60, loss = 0.0022
Iteration 80, loss = 0.0020
--- Epoch 27 / 419 - 2608 epochs total
Iteration 0, loss = 0.0077
Iteration 20, loss = 0.0022
Iteration 40, loss = 0.0042
Iteration 60, loss = 0.0020
Iteration 80, loss = 0.0015
--- Epoch 28 / 419 - 2609 epochs total
Iteration 0, loss = 0.0017
Iteration 20, loss = 0.0046
Iteration 40, loss = 0.0021
Iteration 60, loss = 0.0015
Iteration 80, loss = 0.0057
--- Epoch 29 / 419 - 2610 epochs total
Iteration 0, loss = 0.0088
Iteration 20, loss = 0.0036
Iteration 40, loss = 0.0025
Iteration 60, loss = 0.0057
Iteration 80, loss = 0.0029
--- Epoch 30 / 419 - 2611 epochs total
Iteration 0, loss = 0.0027
Iteration 20, loss = 0.0069
Iteration 40, loss = 0.0057
Iteration 60, loss = 0.0044
Iteration 80, loss = 0.0267
--- Epoch 31 / 419 - 2612 epochs total
Iteration 0, loss = 0.0028
Iteration 20, loss = 0.0032
Iteration 40, loss = 0.0027
Iteration 60, loss = 0.0059
Iteration 80, loss = 0.0092
--- Epoch 32 / 419 - 2613 epochs total
Iteration 0, loss = 0.0024
Iteration 20, loss = 0.0015
Iteration 40, loss = 0.0019
Iteration 60, loss = 0.0065
Iteration 80, loss = 0.0033
--- Epoch 33 / 419 - 2614 epochs total
Iteration 0, loss = 0.0039
Iteration 20, loss = 0.0030
Iteration 40, loss = 0.0108
Iteration 60, loss = 0.0023
Iteration 80, loss = 0.0043
--- Epoch 34 / 419 - 2615 epochs total
Iteration 0, loss = 0.0071
Iteration 20, loss = 0.0028
Iteration 40, loss = 0.0014
Iteration 60, loss = 0.0024
Iteration 80, loss = 0.0030
--- Epoch 35 / 419 - 2616 epochs total
Iteration 0, loss = 0.0025
Iteration 20, loss = 0.0041
Iteration 40, loss = 0.0025
Iteration 60, loss = 0.0012
Iteration 80, loss = 0.0033
--- Epoch 36 / 419 - 2617 epochs total
Iteration 0, loss = 0.0038
Iteration 20, loss = 0.0018
Iteration 40, loss = 0.0034
Iteration 60, loss = 0.0024
Iteration 80, loss = 0.0016
--- Epoch 37 / 419 - 2618 epochs total
Iteration 0, loss = 0.0126
Iteration 20, loss = 0.0033
Iteration 40, loss = 0.0020
Iteration 60, loss = 0.0506
Iteration 80, loss = 0.0043
--- Epoch 38 / 419 - 2619 epochs total
Iteration 0, loss = 0.0099
Iteration 20, loss = 0.0064
Iteration 40, loss = 0.0115
Iteration 60, loss = 0.0034
Iteration 80, loss = 0.0068
--- Epoch 39 / 419 - 2620 epochs total
Iteration 0, loss = 0.0032
Iteration 20, loss = 0.0072
Iteration 40, loss = 0.0033
Iteration 60, loss = 0.0039
Iteration 80, loss = 0.0036
--- Epoch 40 / 419 - 2621 epochs total
Iteration 0, loss = 0.0038
Iteration 20, loss = 0.0015
Iteration 40, loss = 0.0037
Iteration 60, loss = 0.0031
Iteration 80, loss = 0.0021
--- Epoch 41 / 419 - 2622 epochs total
Iteration 0, loss = 0.0064
Iteration 20, loss = 0.0049
Iteration 40, loss = 0.0066
Iteration 60, loss = 0.0052
Iteration 80, loss = 0.0024
--- Epoch 42 / 419 - 2623 epochs total
Iteration 0, loss = 0.0013
Iteration 20, loss = 0.0130
Iteration 40, loss = 0.0065
Iteration 60, loss = 0.0031
Iteration 80, loss = 0.0022
--- Epoch 43 / 419 - 2624 epochs total
Iteration 0, loss = 0.0076
Iteration 20, loss = 0.0051
Iteration 40, loss = 0.0047
Iteration 60, loss = 0.0013
Iteration 80, loss = 0.0181
--- Epoch 44 / 419 - 2625 epochs total
Iteration 0, loss = 0.0037
Iteration 20, loss = 0.0035
Iteration 40, loss = 0.0049
Iteration 60, loss = 0.0060
Iteration 80, loss = 0.0040
--- Epoch 45 / 419 - 2626 epochs total
Iteration 0, loss = 0.0022
Iteration 20, loss = 0.0035
Iteration 40, loss = 0.0016
Iteration 60, loss = 0.0041
Iteration 80, loss = 0.0015
--- Epoch 46 / 419 - 2627 epochs total
Iteration 0, loss = 0.0019
Iteration 20, loss = 0.0046
Iteration 40, loss = 0.0048
Iteration 60, loss = 0.0035
Iteration 80, loss = 0.0055
--- Epoch 47 / 419 - 2628 epochs total
Iteration 0, loss = 0.0113
Iteration 20, loss = 0.0022
Iteration 40, loss = 0.0067
Iteration 60, loss = 0.0038
Iteration 80, loss = 0.0061
--- Epoch 48 / 419 - 2629 epochs total
Iteration 0, loss = 0.0034
Iteration 20, loss = 0.0038
Iteration 40, loss = 0.0063
---------------------------------------------------------------------------
KeyboardInterrupt                         Traceback (most recent call last)
<ipython-input-130-3d0cbeabd450> in <module>
----> 1 train(model11, optimizer, epochs=419, x_train=data["X_train_frog"],  y_train=data["y_train_frog"], criterion=nn.MSELoss())

<ipython-input-18-95dee9c67ab2> in train(model, optimizer, epochs, x_train, y_train, criterion)
     28             y = y_batch[t].to(device=device, dtype=dtype)
     29 
---> 30             scores = model(x)
     31 
     32             loss = criterion(scores.view(-1), y.view(-1))

/opt/anaconda3/envs/cs682/lib/python3.6/site-packages/torch/nn/modules/module.py in _call_impl(self, *input, **kwargs)
    720             result = self._slow_forward(*input, **kwargs)
    721         else:
--> 722             result = self.forward(*input, **kwargs)
    723         for hook in itertools.chain(
    724                 _global_forward_hooks.values(),

<ipython-input-24-48b049d402e0> in forward(self, x)
     26         # Encoder
     27         scores = F.relu(self.batchnorm1(self.conv1(x)))
---> 28         scores = F.relu(self.batchnorm2(self.conv2(scores)))
     29         scores = F.relu(self.batchnorm3(self.conv3(scores)))
     30         scores = F.relu(self.batchnorm4(self.conv4(scores)))

/opt/anaconda3/envs/cs682/lib/python3.6/site-packages/torch/nn/modules/module.py in _call_impl(self, *input, **kwargs)
    720             result = self._slow_forward(*input, **kwargs)
    721         else:
--> 722             result = self.forward(*input, **kwargs)
    723         for hook in itertools.chain(
    724                 _global_forward_hooks.values(),

/opt/anaconda3/envs/cs682/lib/python3.6/site-packages/torch/nn/modules/batchnorm.py in forward(self, input)
    134             self.running_mean if not self.training or self.track_running_stats else None,
    135             self.running_var if not self.training or self.track_running_stats else None,
--> 136             self.weight, self.bias, bn_training, exponential_average_factor, self.eps)
    137 
    138 

/opt/anaconda3/envs/cs682/lib/python3.6/site-packages/torch/nn/functional.py in batch_norm(input, running_mean, running_var, weight, bias, training, momentum, eps)
   2014     return torch.batch_norm(
   2015         input, weight, bias, running_mean, running_var,
-> 2016         training, momentum, eps, torch.backends.cudnn.enabled
   2017     )
   2018 

KeyboardInterrupt: 
In [169]:
# Evaluate model11 on the held-out "frog" arrays.
# NOTE(review): the criterion passed here is L1 (mean absolute error), whereas the
# training cell for model11 optimises MSE -- whatever testModel reports with this
# criterion is therefore not on the same scale as the training-loss log.
testModel(
    model11,
    x_test=data["X_test_frog"],
    y_test=data["y_test_frog"],
    criterion=nn.L1Loss(),
)
In [52]:
# model12: a freshly initialised ConvNet4, optimised with plain SGD (step size 1e-2).
# NOTE: `learning_rate` and `optimizer` are notebook-wide names that other
# model-setup cells rebind as well, so they only describe model12 until the next
# setup cell is executed.
model12 = ConvNet4()
learning_rate = 1e-2
optimizer = optim.SGD(
    model12.parameters(),
    lr=learning_rate,
)
In [124]:
# Train model12 on the `X_train_horse` / `y_train_horse` arrays with an MSE objective.
#
# The optimizer is (re)built from model12's own parameters right here instead of
# relying on the global `optimizer`. That name is shared by every model-setup cell,
# and between this model's setup (In [52]) and this cell (In [124]) the same global
# was also passed to a model9 training run (In [117]), so it cannot be assumed to
# still be bound to model12. An optimizer created for another model only holds that
# model's parameters (presumably train() just calls optimizer.step() -- its full
# body is not shown here).
#
# SGD is configured without momentum, so it keeps no per-parameter state and
# recreating it is equivalent to reusing a correctly bound instance.
# `learning_rate` is the notebook-wide value set by the setup cells (1e-2).
optimizer = optim.SGD(model12.parameters(), lr=learning_rate)
train(
    model12,
    optimizer,
    epochs=1506,
    x_train=data["X_train_horse"],
    y_train=data["y_train_horse"],
    criterion=nn.MSELoss(),
)
--- Epoch 1 / 1506 - 1495 epochs total
Iteration 0, loss = 0.0038
Iteration 20, loss = 0.0025
Iteration 40, loss = 0.0029
Iteration 60, loss = 0.0021
Iteration 80, loss = 0.0085
--- Epoch 2 / 1506 - 1496 epochs total
Iteration 0, loss = 0.0033
Iteration 20, loss = 0.0085
Iteration 40, loss = 0.0043
Iteration 60, loss = 0.0025
Iteration 80, loss = 0.0037
--- Epoch 3 / 1506 - 1497 epochs total
Iteration 0, loss = 0.0035
Iteration 20, loss = 0.0051
Iteration 40, loss = 0.0038
Iteration 60, loss = 0.0160
Iteration 80, loss = 0.0053
--- Epoch 4 / 1506 - 1498 epochs total
Iteration 0, loss = 0.0024
Iteration 20, loss = 0.0028
Iteration 40, loss = 0.0023
Iteration 60, loss = 0.0024
Iteration 80, loss = 0.0053
--- Epoch 5 / 1506 - 1499 epochs total
Iteration 0, loss = 0.0037
Iteration 20, loss = 0.0059
Iteration 40, loss = 0.0021
Iteration 60, loss = 0.0059
Iteration 80, loss = 0.0034
--- Epoch 6 / 1506 - 1500 epochs total
Iteration 0, loss = 0.0059
Iteration 20, loss = 0.0060
Iteration 40, loss = 0.0087
Iteration 60, loss = 0.0119
Iteration 80, loss = 0.0033
--- Epoch 7 / 1506 - 1501 epochs total
Iteration 0, loss = 0.0026
Iteration 20, loss = 0.0024
Iteration 40, loss = 0.0032
Iteration 60, loss = 0.0020
Iteration 80, loss = 0.0041
--- Epoch 8 / 1506 - 1502 epochs total
Iteration 0, loss = 0.0022
Iteration 20, loss = 0.0061
Iteration 40, loss = 0.0030
Iteration 60, loss = 0.0078
Iteration 80, loss = 0.0042
--- Epoch 9 / 1506 - 1503 epochs total
Iteration 0, loss = 0.0023
Iteration 20, loss = 0.0057
Iteration 40, loss = 0.0030
Iteration 60, loss = 0.0058
Iteration 80, loss = 0.0051
--- Epoch 10 / 1506 - 1504 epochs total
Iteration 0, loss = 0.0041
Iteration 20, loss = 0.0039
Iteration 40, loss = 0.0029
Iteration 60, loss = 0.0037
Iteration 80, loss = 0.0025
--- Epoch 11 / 1506 - 1505 epochs total
Iteration 0, loss = 0.0053
Iteration 20, loss = 0.0015
Iteration 40, loss = 0.0032
Iteration 60, loss = 0.0018
Iteration 80, loss = 0.0065
--- Epoch 12 / 1506 - 1506 epochs total
Iteration 0, loss = 0.0023
Iteration 20, loss = 0.0074
Iteration 40, loss = 0.0071
Iteration 60, loss = 0.0024
Iteration 80, loss = 0.0022
--- Epoch 13 / 1506 - 1507 epochs total
Iteration 0, loss = 0.0036
Iteration 20, loss = 0.0017
Iteration 40, loss = 0.0023
Iteration 60, loss = 0.0041
Iteration 80, loss = 0.0027
--- Epoch 14 / 1506 - 1508 epochs total
Iteration 0, loss = 0.0027
Iteration 20, loss = 0.0062
Iteration 40, loss = 0.0057
Iteration 60, loss = 0.0071
Iteration 80, loss = 0.0026
--- Epoch 15 / 1506 - 1509 epochs total
Iteration 0, loss = 0.0047
Iteration 20, loss = 0.0055
Iteration 40, loss = 0.0038
Iteration 60, loss = 0.0050
Iteration 80, loss = 0.0080
--- Epoch 16 / 1506 - 1510 epochs total
Iteration 0, loss = 0.0029
Iteration 20, loss = 0.0030
Iteration 40, loss = 0.0034
Iteration 60, loss = 0.0043
Iteration 80, loss = 0.0054
--- Epoch 17 / 1506 - 1511 epochs total
Iteration 0, loss = 0.0106
Iteration 20, loss = 0.0044
Iteration 40, loss = 0.0039
Iteration 60, loss = 0.0018
Iteration 80, loss = 0.0030
--- Epoch 18 / 1506 - 1512 epochs total
Iteration 0, loss = 0.0088
Iteration 20, loss = 0.0033
Iteration 40, loss = 0.0019
Iteration 60, loss = 0.0028
Iteration 80, loss = 0.0176
--- Epoch 19 / 1506 - 1513 epochs total
Iteration 0, loss = 0.0045
Iteration 20, loss = 0.0035
Iteration 40, loss = 0.0055
Iteration 60, loss = 0.0013
Iteration 80, loss = 0.0054
--- Epoch 20 / 1506 - 1514 epochs total
Iteration 0, loss = 0.0139
Iteration 20, loss = 0.0027
Iteration 40, loss = 0.0024
Iteration 60, loss = 0.0043
Iteration 80, loss = 0.0027
--- Epoch 21 / 1506 - 1515 epochs total
Iteration 0, loss = 0.0045
Iteration 20, loss = 0.0028
Iteration 40, loss = 0.0025
Iteration 60, loss = 0.0221
Iteration 80, loss = 0.0028
--- Epoch 22 / 1506 - 1516 epochs total
Iteration 0, loss = 0.0055
Iteration 20, loss = 0.0018
Iteration 40, loss = 0.0022
Iteration 60, loss = 0.0028
Iteration 80, loss = 0.0093
--- Epoch 23 / 1506 - 1517 epochs total
Iteration 0, loss = 0.0069
Iteration 20, loss = 0.0021
Iteration 40, loss = 0.0049
Iteration 60, loss = 0.0073
Iteration 80, loss = 0.0032
--- Epoch 24 / 1506 - 1518 epochs total
Iteration 0, loss = 0.0041
Iteration 20, loss = 0.0032
Iteration 40, loss = 0.0339
Iteration 60, loss = 0.0077
Iteration 80, loss = 0.0041
--- Epoch 25 / 1506 - 1519 epochs total
Iteration 0, loss = 0.0043
Iteration 20, loss = 0.0080
Iteration 40, loss = 0.0024
Iteration 60, loss = 0.0035
Iteration 80, loss = 0.0029
--- Epoch 26 / 1506 - 1520 epochs total
Iteration 0, loss = 0.0036
Iteration 20, loss = 0.0013
Iteration 40, loss = 0.0069
Iteration 60, loss = 0.0031
Iteration 80, loss = 0.0028
--- Epoch 27 / 1506 - 1521 epochs total
Iteration 0, loss = 0.0023
Iteration 20, loss = 0.0043
Iteration 40, loss = 0.0031
Iteration 60, loss = 0.0073
Iteration 80, loss = 0.0034
--- Epoch 28 / 1506 - 1522 epochs total
Iteration 0, loss = 0.0068
Iteration 20, loss = 0.0029
Iteration 40, loss = 0.0019
Iteration 60, loss = 0.0035
Iteration 80, loss = 0.0068
--- Epoch 29 / 1506 - 1523 epochs total
Iteration 0, loss = 0.0025
Iteration 20, loss = 0.0058
Iteration 40, loss = 0.0023
Iteration 60, loss = 0.0031
Iteration 80, loss = 0.0051
--- Epoch 30 / 1506 - 1524 epochs total
Iteration 0, loss = 0.0043
Iteration 20, loss = 0.0078
Iteration 40, loss = 0.0024
Iteration 60, loss = 0.0038
Iteration 80, loss = 0.0031
--- Epoch 31 / 1506 - 1525 epochs total
Iteration 0, loss = 0.0027
Iteration 20, loss = 0.0029
Iteration 40, loss = 0.0071
Iteration 60, loss = 0.0044
Iteration 80, loss = 0.0020
--- Epoch 32 / 1506 - 1526 epochs total
Iteration 0, loss = 0.0035
Iteration 20, loss = 0.0041
Iteration 40, loss = 0.0064
Iteration 60, loss = 0.0064
Iteration 80, loss = 0.0066
--- Epoch 33 / 1506 - 1527 epochs total
Iteration 0, loss = 0.0031
Iteration 20, loss = 0.0050
Iteration 40, loss = 0.0042
Iteration 60, loss = 0.0037
Iteration 80, loss = 0.0074
--- Epoch 34 / 1506 - 1528 epochs total
Iteration 0, loss = 0.0032
Iteration 20, loss = 0.0052
Iteration 40, loss = 0.0065
Iteration 60, loss = 0.0030
Iteration 80, loss = 0.0035
--- Epoch 35 / 1506 - 1529 epochs total
Iteration 0, loss = 0.0045
Iteration 20, loss = 0.0053
Iteration 40, loss = 0.0030
Iteration 60, loss = 0.0039
Iteration 80, loss = 0.0025
--- Epoch 36 / 1506 - 1530 epochs total
Iteration 0, loss = 0.0049
Iteration 20, loss = 0.0053
Iteration 40, loss = 0.0019
Iteration 60, loss = 0.0082
Iteration 80, loss = 0.0050
--- Epoch 37 / 1506 - 1531 epochs total
Iteration 0, loss = 0.0030
Iteration 20, loss = 0.0043
Iteration 40, loss = 0.0055
Iteration 60, loss = 0.0076
Iteration 80, loss = 0.0032
--- Epoch 38 / 1506 - 1532 epochs total
Iteration 0, loss = 0.0035
Iteration 20, loss = 0.0031
Iteration 40, loss = 0.0028
Iteration 60, loss = 0.0110
Iteration 80, loss = 0.0034
--- Epoch 39 / 1506 - 1533 epochs total
Iteration 0, loss = 0.0026
Iteration 20, loss = 0.0039
Iteration 40, loss = 0.0031
Iteration 60, loss = 0.0021
Iteration 80, loss = 0.0047
--- Epoch 40 / 1506 - 1534 epochs total
Iteration 0, loss = 0.0036
Iteration 20, loss = 0.0041
Iteration 40, loss = 0.0026
Iteration 60, loss = 0.0035
Iteration 80, loss = 0.0141
--- Epoch 41 / 1506 - 1535 epochs total
Iteration 0, loss = 0.0022
Iteration 20, loss = 0.0034
Iteration 40, loss = 0.0013
Iteration 60, loss = 0.0095
Iteration 80, loss = 0.0020
--- Epoch 42 / 1506 - 1536 epochs total
Iteration 0, loss = 0.0025
Iteration 20, loss = 0.0035
Iteration 40, loss = 0.0028
Iteration 60, loss = 0.0040
Iteration 80, loss = 0.0036
--- Epoch 43 / 1506 - 1537 epochs total
Iteration 0, loss = 0.0075
Iteration 20, loss = 0.0034
Iteration 40, loss = 0.0028
Iteration 60, loss = 0.0019
Iteration 80, loss = 0.0053
--- Epoch 44 / 1506 - 1538 epochs total
Iteration 0, loss = 0.0048
Iteration 20, loss = 0.0029
Iteration 40, loss = 0.0028
Iteration 60, loss = 0.0031
Iteration 80, loss = 0.0077
--- Epoch 45 / 1506 - 1539 epochs total
Iteration 0, loss = 0.0032
Iteration 20, loss = 0.0032
Iteration 40, loss = 0.0054
Iteration 60, loss = 0.0038
Iteration 80, loss = 0.0109
--- Epoch 46 / 1506 - 1540 epochs total
Iteration 0, loss = 0.0169
Iteration 20, loss = 0.0045
Iteration 40, loss = 0.0047
Iteration 60, loss = 0.0020
Iteration 80, loss = 0.0034
--- Epoch 47 / 1506 - 1541 epochs total
Iteration 0, loss = 0.0194
Iteration 20, loss = 0.0026
Iteration 40, loss = 0.0036
Iteration 60, loss = 0.0037
Iteration 80, loss = 0.0026
--- Epoch 48 / 1506 - 1542 epochs total
Iteration 0, loss = 0.0069
Iteration 20, loss = 0.0071
Iteration 40, loss = 0.0068
Iteration 60, loss = 0.0024
Iteration 80, loss = 0.0026
--- Epoch 49 / 1506 - 1543 epochs total
Iteration 0, loss = 0.0021
Iteration 20, loss = 0.0036
Iteration 40, loss = 0.0057
Iteration 60, loss = 0.0015
Iteration 80, loss = 0.0025
--- Epoch 50 / 1506 - 1544 epochs total
Iteration 0, loss = 0.0036
Iteration 20, loss = 0.0037
Iteration 40, loss = 0.0072
Iteration 60, loss = 0.0028
Iteration 80, loss = 0.0226
--- Epoch 51 / 1506 - 1545 epochs total
Iteration 0, loss = 0.0025
Iteration 20, loss = 0.0033
Iteration 40, loss = 0.0048
Iteration 60, loss = 0.0027
Iteration 80, loss = 0.0097
--- Epoch 52 / 1506 - 1546 epochs total
Iteration 0, loss = 0.0109
Iteration 20, loss = 0.0028
Iteration 40, loss = 0.0032
Iteration 60, loss = 0.0133
Iteration 80, loss = 0.0039
--- Epoch 53 / 1506 - 1547 epochs total
Iteration 0, loss = 0.0038
Iteration 20, loss = 0.0028
Iteration 40, loss = 0.0038
Iteration 60, loss = 0.0027
Iteration 80, loss = 0.0016
--- Epoch 54 / 1506 - 1548 epochs total
Iteration 0, loss = 0.0045
Iteration 20, loss = 0.0128
Iteration 40, loss = 0.0024
Iteration 60, loss = 0.0029
Iteration 80, loss = 0.0061
--- Epoch 55 / 1506 - 1549 epochs total
Iteration 0, loss = 0.0055
Iteration 20, loss = 0.0017
Iteration 40, loss = 0.0019
Iteration 60, loss = 0.0058
Iteration 80, loss = 0.0039
--- Epoch 56 / 1506 - 1550 epochs total
Iteration 0, loss = 0.0032
Iteration 20, loss = 0.0148
Iteration 40, loss = 0.0095
Iteration 60, loss = 0.0021
Iteration 80, loss = 0.0050
--- Epoch 57 / 1506 - 1551 epochs total
Iteration 0, loss = 0.0108
Iteration 20, loss = 0.0025
Iteration 40, loss = 0.0040
Iteration 60, loss = 0.0042
Iteration 80, loss = 0.0088
--- Epoch 58 / 1506 - 1552 epochs total
Iteration 0, loss = 0.0046
Iteration 20, loss = 0.0020
Iteration 40, loss = 0.0022
Iteration 60, loss = 0.0081
Iteration 80, loss = 0.0029
--- Epoch 59 / 1506 - 1553 epochs total
Iteration 0, loss = 0.0019
Iteration 20, loss = 0.0060
Iteration 40, loss = 0.0053
Iteration 60, loss = 0.0048
Iteration 80, loss = 0.0064
--- Epoch 60 / 1506 - 1554 epochs total
Iteration 0, loss = 0.0046
Iteration 20, loss = 0.0020
Iteration 40, loss = 0.0049
Iteration 60, loss = 0.0030
Iteration 80, loss = 0.0172
--- Epoch 61 / 1506 - 1555 epochs total
Iteration 0, loss = 0.0028
Iteration 20, loss = 0.0031
Iteration 40, loss = 0.0049
Iteration 60, loss = 0.0035
Iteration 80, loss = 0.0069
--- Epoch 62 / 1506 - 1556 epochs total
Iteration 0, loss = 0.0085
Iteration 20, loss = 0.0120
Iteration 40, loss = 0.0033
Iteration 60, loss = 0.0042
Iteration 80, loss = 0.0040
--- Epoch 63 / 1506 - 1557 epochs total
Iteration 0, loss = 0.0043
Iteration 20, loss = 0.0148
Iteration 40, loss = 0.0061
Iteration 60, loss = 0.0023
Iteration 80, loss = 0.0046
--- Epoch 64 / 1506 - 1558 epochs total
Iteration 0, loss = 0.0093
Iteration 20, loss = 0.0044
Iteration 40, loss = 0.0040
Iteration 60, loss = 0.0018
Iteration 80, loss = 0.0024
--- Epoch 65 / 1506 - 1559 epochs total
Iteration 0, loss = 0.0021
Iteration 20, loss = 0.0044
Iteration 40, loss = 0.0039
Iteration 60, loss = 0.0019
Iteration 80, loss = 0.0022
--- Epoch 66 / 1506 - 1560 epochs total
Iteration 0, loss = 0.0024
Iteration 20, loss = 0.0045
Iteration 40, loss = 0.0127
Iteration 60, loss = 0.0094
Iteration 80, loss = 0.0043
--- Epoch 67 / 1506 - 1561 epochs total
Iteration 0, loss = 0.0027
Iteration 20, loss = 0.0045
Iteration 40, loss = 0.0090
Iteration 60, loss = 0.0073
Iteration 80, loss = 0.0086
--- Epoch 68 / 1506 - 1562 epochs total
Iteration 0, loss = 0.0048
Iteration 20, loss = 0.0028
Iteration 40, loss = 0.0069
Iteration 60, loss = 0.0031
Iteration 80, loss = 0.0039
--- Epoch 69 / 1506 - 1563 epochs total
Iteration 0, loss = 0.0027
Iteration 20, loss = 0.0032
Iteration 40, loss = 0.0071
Iteration 60, loss = 0.0041
Iteration 80, loss = 0.0035
--- Epoch 70 / 1506 - 1564 epochs total
Iteration 0, loss = 0.0064
Iteration 20, loss = 0.0017
Iteration 40, loss = 0.0084
Iteration 60, loss = 0.0024
Iteration 80, loss = 0.0017
--- Epoch 71 / 1506 - 1565 epochs total
Iteration 0, loss = 0.0038
Iteration 20, loss = 0.0028
Iteration 40, loss = 0.0111
Iteration 60, loss = 0.0100
Iteration 80, loss = 0.0026
--- Epoch 72 / 1506 - 1566 epochs total
Iteration 0, loss = 0.0041
Iteration 20, loss = 0.0030
Iteration 40, loss = 0.0052
Iteration 60, loss = 0.0045
Iteration 80, loss = 0.0038
--- Epoch 73 / 1506 - 1567 epochs total
Iteration 0, loss = 0.0058
Iteration 20, loss = 0.0035
Iteration 40, loss = 0.0032
Iteration 60, loss = 0.0038
Iteration 80, loss = 0.0059
--- Epoch 74 / 1506 - 1568 epochs total
Iteration 0, loss = 0.0010
Iteration 20, loss = 0.0074
Iteration 40, loss = 0.0039
Iteration 60, loss = 0.0085
Iteration 80, loss = 0.0026
--- Epoch 75 / 1506 - 1569 epochs total
Iteration 0, loss = 0.0019
Iteration 20, loss = 0.0057
Iteration 40, loss = 0.0020
Iteration 60, loss = 0.0037
Iteration 80, loss = 0.0041
--- Epoch 76 / 1506 - 1570 epochs total
Iteration 0, loss = 0.0015
Iteration 20, loss = 0.0014
Iteration 40, loss = 0.0022
Iteration 60, loss = 0.0026
Iteration 80, loss = 0.0028
--- Epoch 77 / 1506 - 1571 epochs total
Iteration 0, loss = 0.0019
Iteration 20, loss = 0.0068
Iteration 40, loss = 0.0086
Iteration 60, loss = 0.0030
Iteration 80, loss = 0.0224
--- Epoch 78 / 1506 - 1572 epochs total
Iteration 0, loss = 0.0029
Iteration 20, loss = 0.0042
Iteration 40, loss = 0.0046
Iteration 60, loss = 0.0039
Iteration 80, loss = 0.0059
--- Epoch 79 / 1506 - 1573 epochs total
Iteration 0, loss = 0.0032
Iteration 20, loss = 0.0053
Iteration 40, loss = 0.0029
Iteration 60, loss = 0.0032
Iteration 80, loss = 0.0035
--- Epoch 80 / 1506 - 1574 epochs total
Iteration 0, loss = 0.0026
Iteration 20, loss = 0.0018
Iteration 40, loss = 0.0066
Iteration 60, loss = 0.0022
Iteration 80, loss = 0.0070
--- Epoch 81 / 1506 - 1575 epochs total
Iteration 0, loss = 0.0026
Iteration 20, loss = 0.0024
Iteration 40, loss = 0.0141
Iteration 60, loss = 0.0040
Iteration 80, loss = 0.0049
--- Epoch 82 / 1506 - 1576 epochs total
Iteration 0, loss = 0.0020
Iteration 20, loss = 0.0020
Iteration 40, loss = 0.0015
Iteration 60, loss = 0.0052
Iteration 80, loss = 0.0021
--- Epoch 83 / 1506 - 1577 epochs total
Iteration 0, loss = 0.0019
Iteration 20, loss = 0.0032
Iteration 40, loss = 0.0026
Iteration 60, loss = 0.0037
Iteration 80, loss = 0.0042
--- Epoch 84 / 1506 - 1578 epochs total
Iteration 0, loss = 0.0064
Iteration 20, loss = 0.0039
Iteration 40, loss = 0.0023
Iteration 60, loss = 0.0028
Iteration 80, loss = 0.0035
--- Epoch 85 / 1506 - 1579 epochs total
Iteration 0, loss = 0.0036
Iteration 20, loss = 0.0043
Iteration 40, loss = 0.0031
Iteration 60, loss = 0.0046
Iteration 80, loss = 0.0022
--- Epoch 86 / 1506 - 1580 epochs total
Iteration 0, loss = 0.0073
Iteration 20, loss = 0.0139
Iteration 40, loss = 0.0023
Iteration 60, loss = 0.0037
Iteration 80, loss = 0.0097
--- Epoch 87 / 1506 - 1581 epochs total
Iteration 0, loss = 0.0045
Iteration 20, loss = 0.0018
Iteration 40, loss = 0.0032
Iteration 60, loss = 0.0096
Iteration 80, loss = 0.0023
--- Epoch 88 / 1506 - 1582 epochs total
Iteration 0, loss = 0.0072
Iteration 20, loss = 0.0035
Iteration 40, loss = 0.0017
Iteration 60, loss = 0.0027
Iteration 80, loss = 0.0019
--- Epoch 89 / 1506 - 1583 epochs total
Iteration 0, loss = 0.0067
Iteration 20, loss = 0.0018
Iteration 40, loss = 0.0032
Iteration 60, loss = 0.0049
Iteration 80, loss = 0.0051
--- Epoch 90 / 1506 - 1584 epochs total
Iteration 0, loss = 0.0033
Iteration 20, loss = 0.0025
Iteration 40, loss = 0.0049
Iteration 60, loss = 0.0052
Iteration 80, loss = 0.0027
--- Epoch 91 / 1506 - 1585 epochs total
Iteration 0, loss = 0.0039
Iteration 20, loss = 0.0035
Iteration 40, loss = 0.0072
Iteration 60, loss = 0.0061
Iteration 80, loss = 0.0018
--- Epoch 92 / 1506 - 1586 epochs total
Iteration 0, loss = 0.0073
Iteration 20, loss = 0.0033
Iteration 40, loss = 0.0028
Iteration 60, loss = 0.0048
Iteration 80, loss = 0.0052
--- Epoch 93 / 1506 - 1587 epochs total
Iteration 0, loss = 0.0013
Iteration 20, loss = 0.0107
Iteration 40, loss = 0.0040
Iteration 60, loss = 0.0051
Iteration 80, loss = 0.0040
--- Epoch 94 / 1506 - 1588 epochs total
Iteration 0, loss = 0.0031
Iteration 20, loss = 0.0016
Iteration 40, loss = 0.0043
Iteration 60, loss = 0.0070
Iteration 80, loss = 0.0037
--- Epoch 95 / 1506 - 1589 epochs total
Iteration 0, loss = 0.0064
Iteration 20, loss = 0.0047
Iteration 40, loss = 0.0041
Iteration 60, loss = 0.0032
Iteration 80, loss = 0.0028
--- Epoch 96 / 1506 - 1590 epochs total
Iteration 0, loss = 0.0029
Iteration 20, loss = 0.0059
Iteration 40, loss = 0.0043
Iteration 60, loss = 0.0043
Iteration 80, loss = 0.0044
--- Epoch 97 / 1506 - 1591 epochs total
Iteration 0, loss = 0.0018
Iteration 20, loss = 0.0020
Iteration 40, loss = 0.0025
Iteration 60, loss = 0.0032
Iteration 80, loss = 0.0028
--- Epoch 98 / 1506 - 1592 epochs total
Iteration 0, loss = 0.0033
Iteration 20, loss = 0.0016
Iteration 40, loss = 0.0086
Iteration 60, loss = 0.0044
Iteration 80, loss = 0.0028
--- Epoch 99 / 1506 - 1593 epochs total
Iteration 0, loss = 0.0024
Iteration 20, loss = 0.0067
Iteration 40, loss = 0.0030
Iteration 60, loss = 0.0052
Iteration 80, loss = 0.0056
--- Epoch 100 / 1506 - 1594 epochs total
Iteration 0, loss = 0.0077
Iteration 20, loss = 0.0022
Iteration 40, loss = 0.0022
Iteration 60, loss = 0.0029
Iteration 80, loss = 0.0022
--- Epoch 101 / 1506 - 1595 epochs total
Iteration 0, loss = 0.0170
Iteration 20, loss = 0.0051
Iteration 40, loss = 0.0034
Iteration 60, loss = 0.0036
Iteration 80, loss = 0.0041
--- Epoch 102 / 1506 - 1596 epochs total
Iteration 0, loss = 0.0034
Iteration 20, loss = 0.0070
Iteration 40, loss = 0.0041
Iteration 60, loss = 0.0040
Iteration 80, loss = 0.0062
--- Epoch 103 / 1506 - 1597 epochs total
Iteration 0, loss = 0.0066
Iteration 20, loss = 0.0024
Iteration 40, loss = 0.0069
Iteration 60, loss = 0.0030
Iteration 80, loss = 0.0038
--- Epoch 104 / 1506 - 1598 epochs total
Iteration 0, loss = 0.0046
Iteration 20, loss = 0.0055
Iteration 40, loss = 0.0027
Iteration 60, loss = 0.0037
Iteration 80, loss = 0.0056
--- Epoch 105 / 1506 - 1599 epochs total
Iteration 0, loss = 0.0045
Iteration 20, loss = 0.0029
Iteration 40, loss = 0.0069
Iteration 60, loss = 0.0080
Iteration 80, loss = 0.0078
--- Epoch 106 / 1506 - 1600 epochs total
Iteration 0, loss = 0.0071
Iteration 20, loss = 0.0037
Iteration 40, loss = 0.0039
Iteration 60, loss = 0.0025
Iteration 80, loss = 0.0047
--- Epoch 107 / 1506 - 1601 epochs total
Iteration 0, loss = 0.0047
Iteration 20, loss = 0.0061
Iteration 40, loss = 0.0045
Iteration 60, loss = 0.0046
Iteration 80, loss = 0.0044
--- Epoch 108 / 1506 - 1602 epochs total
Iteration 0, loss = 0.0066
Iteration 20, loss = 0.0052
Iteration 40, loss = 0.0024
Iteration 60, loss = 0.0046
Iteration 80, loss = 0.0031
--- Epoch 109 / 1506 - 1603 epochs total
Iteration 0, loss = 0.0051
Iteration 20, loss = 0.0073
Iteration 40, loss = 0.0023
Iteration 60, loss = 0.0023
Iteration 80, loss = 0.0027
--- Epoch 110 / 1506 - 1604 epochs total
Iteration 0, loss = 0.0035
Iteration 20, loss = 0.0047
Iteration 40, loss = 0.0040
Iteration 60, loss = 0.0023
Iteration 80, loss = 0.0037
--- Epoch 111 / 1506 - 1605 epochs total
Iteration 0, loss = 0.0134
Iteration 20, loss = 0.0092
Iteration 40, loss = 0.0039
Iteration 60, loss = 0.0027
Iteration 80, loss = 0.0017
--- Epoch 112 / 1506 - 1606 epochs total
Iteration 0, loss = 0.0070
Iteration 20, loss = 0.0039
Iteration 40, loss = 0.0339
Iteration 60, loss = 0.0032
Iteration 80, loss = 0.0078
--- Epoch 113 / 1506 - 1607 epochs total
Iteration 0, loss = 0.0039
Iteration 20, loss = 0.0039
Iteration 40, loss = 0.0098
Iteration 60, loss = 0.0021
Iteration 80, loss = 0.0038
--- Epoch 114 / 1506 - 1608 epochs total
Iteration 0, loss = 0.0051
Iteration 20, loss = 0.0021
Iteration 40, loss = 0.0026
Iteration 60, loss = 0.0025
Iteration 80, loss = 0.0049
--- Epoch 115 / 1506 - 1609 epochs total
Iteration 0, loss = 0.0039
Iteration 20, loss = 0.0123
Iteration 40, loss = 0.0043
Iteration 60, loss = 0.0086
Iteration 80, loss = 0.0033
--- Epoch 116 / 1506 - 1610 epochs total
Iteration 0, loss = 0.0027
Iteration 20, loss = 0.0038
Iteration 40, loss = 0.0039
Iteration 60, loss = 0.0022
Iteration 80, loss = 0.0022
--- Epoch 117 / 1506 - 1611 epochs total
Iteration 0, loss = 0.0025
Iteration 20, loss = 0.0045
Iteration 40, loss = 0.0143
Iteration 60, loss = 0.0017
Iteration 80, loss = 0.0024
--- Epoch 118 / 1506 - 1612 epochs total
Iteration 0, loss = 0.0056
Iteration 20, loss = 0.0027
Iteration 40, loss = 0.0032
Iteration 60, loss = 0.0018
Iteration 80, loss = 0.0083
--- Epoch 119 / 1506 - 1613 epochs total
Iteration 0, loss = 0.0032
Iteration 20, loss = 0.0049
Iteration 40, loss = 0.0052
Iteration 60, loss = 0.0030
Iteration 80, loss = 0.0030
--- Epoch 120 / 1506 - 1614 epochs total
Iteration 0, loss = 0.0023
Iteration 20, loss = 0.0140
Iteration 40, loss = 0.0028
Iteration 60, loss = 0.0037
Iteration 80, loss = 0.0033
--- Epoch 121 / 1506 - 1615 epochs total
Iteration 0, loss = 0.0064
Iteration 20, loss = 0.0025
Iteration 40, loss = 0.0032
Iteration 60, loss = 0.0052
Iteration 80, loss = 0.0033
--- Epoch 122 / 1506 - 1616 epochs total
Iteration 0, loss = 0.0095
Iteration 20, loss = 0.0056
Iteration 40, loss = 0.0060
Iteration 60, loss = 0.0036
Iteration 80, loss = 0.0036
--- Epoch 123 / 1506 - 1617 epochs total
Iteration 0, loss = 0.0046
Iteration 20, loss = 0.0023
Iteration 40, loss = 0.0027
Iteration 60, loss = 0.0029
Iteration 80, loss = 0.0059
--- Epoch 124 / 1506 - 1618 epochs total
Iteration 0, loss = 0.0067
Iteration 20, loss = 0.0037
Iteration 40, loss = 0.0027
Iteration 60, loss = 0.0031
Iteration 80, loss = 0.0117
--- Epoch 125 / 1506 - 1619 epochs total
Iteration 0, loss = 0.0018
Iteration 20, loss = 0.0036
Iteration 40, loss = 0.0021
Iteration 60, loss = 0.0040
Iteration 80, loss = 0.0148
--- Epoch 126 / 1506 - 1620 epochs total
Iteration 0, loss = 0.0019
Iteration 20, loss = 0.0100
Iteration 40, loss = 0.0024
Iteration 60, loss = 0.0020
Iteration 80, loss = 0.0034
--- Epoch 127 / 1506 - 1621 epochs total
Iteration 0, loss = 0.0041
Iteration 20, loss = 0.0037
Iteration 40, loss = 0.0058
Iteration 60, loss = 0.0044
Iteration 80, loss = 0.0060
--- Epoch 128 / 1506 - 1622 epochs total
Iteration 0, loss = 0.0223
Iteration 20, loss = 0.0029
Iteration 40, loss = 0.0041
Iteration 60, loss = 0.0072
Iteration 80, loss = 0.0026
--- Epoch 129 / 1506 - 1623 epochs total
Iteration 0, loss = 0.0050
Iteration 20, loss = 0.0131
Iteration 40, loss = 0.0033
Iteration 60, loss = 0.0057
Iteration 80, loss = 0.0031
--- Epoch 130 / 1506 - 1624 epochs total
Iteration 0, loss = 0.0038
Iteration 20, loss = 0.0020
Iteration 40, loss = 0.0031
Iteration 60, loss = 0.0124
Iteration 80, loss = 0.0028
--- Epoch 131 / 1506 - 1625 epochs total
Iteration 0, loss = 0.0039
Iteration 20, loss = 0.0038
Iteration 40, loss = 0.0076
Iteration 60, loss = 0.0027
Iteration 80, loss = 0.0066
--- Epoch 132 / 1506 - 1626 epochs total
Iteration 0, loss = 0.0030
Iteration 20, loss = 0.0056
Iteration 40, loss = 0.0069
Iteration 60, loss = 0.0078
Iteration 80, loss = 0.0027
--- Epoch 133 / 1506 - 1627 epochs total
Iteration 0, loss = 0.0035
Iteration 20, loss = 0.0021
Iteration 40, loss = 0.0027
Iteration 60, loss = 0.0030
Iteration 80, loss = 0.0060
--- Epoch 134 / 1506 - 1628 epochs total
Iteration 0, loss = 0.0037
Iteration 20, loss = 0.0082
Iteration 40, loss = 0.0076
Iteration 60, loss = 0.0041
Iteration 80, loss = 0.0041
--- Epoch 135 / 1506 - 1629 epochs total
Iteration 0, loss = 0.0035
Iteration 20, loss = 0.0037
Iteration 40, loss = 0.0032
Iteration 60, loss = 0.0072
Iteration 80, loss = 0.0028
--- Epoch 136 / 1506 - 1630 epochs total
Iteration 0, loss = 0.0042
Iteration 20, loss = 0.0051
Iteration 40, loss = 0.0020
Iteration 60, loss = 0.0057
Iteration 80, loss = 0.0052
--- Epoch 137 / 1506 - 1631 epochs total
Iteration 0, loss = 0.0017
Iteration 20, loss = 0.0058
Iteration 40, loss = 0.0052
Iteration 60, loss = 0.0039
Iteration 80, loss = 0.0049
--- Epoch 138 / 1506 - 1632 epochs total
Iteration 0, loss = 0.0135
Iteration 20, loss = 0.0080
Iteration 40, loss = 0.0027
Iteration 60, loss = 0.0055
Iteration 80, loss = 0.0154
--- Epoch 139 / 1506 - 1633 epochs total
Iteration 0, loss = 0.0039
Iteration 20, loss = 0.0030
Iteration 40, loss = 0.0041
Iteration 60, loss = 0.0033
Iteration 80, loss = 0.0032
--- Epoch 140 / 1506 - 1634 epochs total
Iteration 0, loss = 0.0121
Iteration 20, loss = 0.0034
Iteration 40, loss = 0.0028
Iteration 60, loss = 0.0036
Iteration 80, loss = 0.0023
--- Epoch 141 / 1506 - 1635 epochs total
Iteration 0, loss = 0.0063
Iteration 20, loss = 0.0039
Iteration 40, loss = 0.0064
Iteration 60, loss = 0.0030
Iteration 80, loss = 0.0058
--- Epoch 142 / 1506 - 1636 epochs total
Iteration 0, loss = 0.0019
Iteration 20, loss = 0.0023
Iteration 40, loss = 0.0030
Iteration 60, loss = 0.0026
Iteration 80, loss = 0.0024
--- Epoch 143 / 1506 - 1637 epochs total
Iteration 0, loss = 0.0040
Iteration 20, loss = 0.0033
Iteration 40, loss = 0.0031
Iteration 60, loss = 0.0059
Iteration 80, loss = 0.0024
--- Epoch 144 / 1506 - 1638 epochs total
Iteration 0, loss = 0.0025
Iteration 20, loss = 0.0075
Iteration 40, loss = 0.0088
Iteration 60, loss = 0.0058
Iteration 80, loss = 0.0011
--- Epoch 145 / 1506 - 1639 epochs total
Iteration 0, loss = 0.0026
Iteration 20, loss = 0.0026
Iteration 40, loss = 0.0025
Iteration 60, loss = 0.0032
Iteration 80, loss = 0.0019
--- Epoch 146 / 1506 - 1640 epochs total
Iteration 0, loss = 0.0033
Iteration 20, loss = 0.0082
Iteration 40, loss = 0.0083
Iteration 60, loss = 0.0040
Iteration 80, loss = 0.0040
--- Epoch 147 / 1506 - 1641 epochs total
Iteration 0, loss = 0.0072
Iteration 20, loss = 0.0018
Iteration 40, loss = 0.0029
Iteration 60, loss = 0.0087
Iteration 80, loss = 0.0057
--- Epoch 148 / 1506 - 1642 epochs total
Iteration 0, loss = 0.0017
Iteration 20, loss = 0.0061
Iteration 40, loss = 0.0062
Iteration 60, loss = 0.0046
Iteration 80, loss = 0.0069
--- Epoch 149 / 1506 - 1643 epochs total
Iteration 0, loss = 0.0044
Iteration 20, loss = 0.0030
Iteration 40, loss = 0.0046
Iteration 60, loss = 0.0015
Iteration 80, loss = 0.0039
--- Epoch 150 / 1506 - 1644 epochs total
Iteration 0, loss = 0.0027
Iteration 20, loss = 0.0032
Iteration 40, loss = 0.0030
Iteration 60, loss = 0.0064
Iteration 80, loss = 0.0035
--- Epoch 151 / 1506 - 1645 epochs total
Iteration 0, loss = 0.0060
Iteration 20, loss = 0.0022
Iteration 40, loss = 0.0058
Iteration 60, loss = 0.0032
Iteration 80, loss = 0.0124
--- Epoch 152 / 1506 - 1646 epochs total
Iteration 0, loss = 0.0058
Iteration 20, loss = 0.0021
Iteration 40, loss = 0.0017
Iteration 60, loss = 0.0021
Iteration 80, loss = 0.0018
--- Epoch 153 / 1506 - 1647 epochs total
Iteration 0, loss = 0.0021
Iteration 20, loss = 0.0028
Iteration 40, loss = 0.0021
Iteration 60, loss = 0.0043
Iteration 80, loss = 0.0042
--- Epoch 154 / 1506 - 1648 epochs total
Iteration 0, loss = 0.0014
Iteration 20, loss = 0.0085
Iteration 40, loss = 0.0020
Iteration 60, loss = 0.0047
Iteration 80, loss = 0.0044
--- Epoch 155 / 1506 - 1649 epochs total
Iteration 0, loss = 0.0125
Iteration 20, loss = 0.0030
Iteration 40, loss = 0.0034
Iteration 60, loss = 0.0035
Iteration 80, loss = 0.0032
--- Epoch 156 / 1506 - 1650 epochs total
Iteration 0, loss = 0.0046
Iteration 20, loss = 0.0067
Iteration 40, loss = 0.0036
Iteration 60, loss = 0.0055
Iteration 80, loss = 0.0037
--- Epoch 157 / 1506 - 1651 epochs total
Iteration 0, loss = 0.0019
Iteration 20, loss = 0.0021
Iteration 40, loss = 0.0028
Iteration 60, loss = 0.0045
Iteration 80, loss = 0.0043
--- Epoch 158 / 1506 - 1652 epochs total
Iteration 0, loss = 0.0030
Iteration 20, loss = 0.0034
Iteration 40, loss = 0.0042
Iteration 60, loss = 0.0095
Iteration 80, loss = 0.0049
--- Epoch 159 / 1506 - 1653 epochs total
Iteration 0, loss = 0.0028
Iteration 20, loss = 0.0049
Iteration 40, loss = 0.0073
Iteration 60, loss = 0.0034
Iteration 80, loss = 0.0038
--- Epoch 160 / 1506 - 1654 epochs total
Iteration 0, loss = 0.0059
Iteration 20, loss = 0.0036
Iteration 40, loss = 0.0027
Iteration 60, loss = 0.0027
Iteration 80, loss = 0.0035
--- Epoch 161 / 1506 - 1655 epochs total
Iteration 0, loss = 0.0039
Iteration 20, loss = 0.0046
Iteration 40, loss = 0.0039
Iteration 60, loss = 0.0060
Iteration 80, loss = 0.0040
--- Epoch 162 / 1506 - 1656 epochs total
Iteration 0, loss = 0.0033
Iteration 20, loss = 0.0074
Iteration 40, loss = 0.0011
Iteration 60, loss = 0.0060
Iteration 80, loss = 0.0088
--- Epoch 163 / 1506 - 1657 epochs total
Iteration 0, loss = 0.0023
Iteration 20, loss = 0.0083
Iteration 40, loss = 0.0035
Iteration 60, loss = 0.0074
Iteration 80, loss = 0.0064
--- Epoch 164 / 1506 - 1658 epochs total
Iteration 0, loss = 0.0028
Iteration 20, loss = 0.0024
Iteration 40, loss = 0.0035
Iteration 60, loss = 0.0048
Iteration 80, loss = 0.0035
--- Epoch 165 / 1506 - 1659 epochs total
Iteration 0, loss = 0.0052
Iteration 20, loss = 0.0031
Iteration 40, loss = 0.0025
Iteration 60, loss = 0.0038
Iteration 80, loss = 0.0080
--- Epoch 166 / 1506 - 1660 epochs total
Iteration 0, loss = 0.0092
Iteration 20, loss = 0.0020
Iteration 40, loss = 0.0058
Iteration 60, loss = 0.0013
Iteration 80, loss = 0.0032
--- Epoch 167 / 1506 - 1661 epochs total
Iteration 0, loss = 0.0035
Iteration 20, loss = 0.0089
Iteration 40, loss = 0.0041
Iteration 60, loss = 0.0048
Iteration 80, loss = 0.0021
--- Epoch 168 / 1506 - 1662 epochs total
Iteration 0, loss = 0.0040
Iteration 20, loss = 0.0049
Iteration 40, loss = 0.0039
Iteration 60, loss = 0.0036
Iteration 80, loss = 0.0052
--- Epoch 169 / 1506 - 1663 epochs total
Iteration 0, loss = 0.0054
Iteration 20, loss = 0.0049
Iteration 40, loss = 0.0122
Iteration 60, loss = 0.0070
Iteration 80, loss = 0.0053
--- Epoch 170 / 1506 - 1664 epochs total
Iteration 0, loss = 0.0073
Iteration 20, loss = 0.0029
Iteration 40, loss = 0.0036
Iteration 60, loss = 0.0025
Iteration 80, loss = 0.0090
--- Epoch 171 / 1506 - 1665 epochs total
Iteration 0, loss = 0.0049
Iteration 20, loss = 0.0023
Iteration 40, loss = 0.0060
Iteration 60, loss = 0.0055
Iteration 80, loss = 0.0028
--- Epoch 172 / 1506 - 1666 epochs total
Iteration 0, loss = 0.0028
Iteration 20, loss = 0.0074
Iteration 40, loss = 0.0032
Iteration 60, loss = 0.0032
Iteration 80, loss = 0.0039
--- Epoch 173 / 1506 - 1667 epochs total
Iteration 0, loss = 0.0050
Iteration 20, loss = 0.0024
Iteration 40, loss = 0.0114
Iteration 60, loss = 0.0044
Iteration 80, loss = 0.0038
--- Epoch 174 / 1506 - 1668 epochs total
Iteration 0, loss = 0.0052
Iteration 20, loss = 0.0032
Iteration 40, loss = 0.0036
Iteration 60, loss = 0.0028
Iteration 80, loss = 0.0082
--- Epoch 175 / 1506 - 1669 epochs total
Iteration 0, loss = 0.0033
Iteration 20, loss = 0.0045
Iteration 40, loss = 0.0020
Iteration 60, loss = 0.0033
Iteration 80, loss = 0.0044
--- Epoch 176 / 1506 - 1670 epochs total
Iteration 0, loss = 0.0023
Iteration 20, loss = 0.0023
Iteration 40, loss = 0.0034
Iteration 60, loss = 0.0025
Iteration 80, loss = 0.0191
--- Epoch 177 / 1506 - 1671 epochs total
Iteration 0, loss = 0.0041
Iteration 20, loss = 0.0037
Iteration 40, loss = 0.0037
Iteration 60, loss = 0.0049
Iteration 80, loss = 0.0020
--- Epoch 178 / 1506 - 1672 epochs total
Iteration 0, loss = 0.0029
Iteration 20, loss = 0.0021
Iteration 40, loss = 0.0036
Iteration 60, loss = 0.0143
Iteration 80, loss = 0.0026
--- Epoch 179 / 1506 - 1673 epochs total
Iteration 0, loss = 0.0056
Iteration 20, loss = 0.0024
Iteration 40, loss = 0.0156
Iteration 60, loss = 0.0037
Iteration 80, loss = 0.0022
--- Epoch 180 / 1506 - 1674 epochs total
Iteration 0, loss = 0.0054
Iteration 20, loss = 0.0038
Iteration 40, loss = 0.0027
Iteration 60, loss = 0.0022
Iteration 80, loss = 0.0053
--- Epoch 181 / 1506 - 1675 epochs total
Iteration 0, loss = 0.0022
Iteration 20, loss = 0.0030
Iteration 40, loss = 0.0065
Iteration 60, loss = 0.0119
Iteration 80, loss = 0.0024
--- Epoch 182 / 1506 - 1676 epochs total
Iteration 0, loss = 0.0017
Iteration 20, loss = 0.0064
Iteration 40, loss = 0.0052
Iteration 60, loss = 0.0028
Iteration 80, loss = 0.0035
--- Epoch 183 / 1506 - 1677 epochs total
Iteration 0, loss = 0.0040
Iteration 20, loss = 0.0096
Iteration 40, loss = 0.0122
Iteration 60, loss = 0.0028
Iteration 80, loss = 0.0049
--- Epoch 184 / 1506 - 1678 epochs total
Iteration 0, loss = 0.0046
Iteration 20, loss = 0.0051
Iteration 40, loss = 0.0021
Iteration 60, loss = 0.0039
Iteration 80, loss = 0.0069
--- Epoch 185 / 1506 - 1679 epochs total
Iteration 0, loss = 0.0033
Iteration 20, loss = 0.0055
Iteration 40, loss = 0.0034
Iteration 60, loss = 0.0042
Iteration 80, loss = 0.0031
--- Epoch 186 / 1506 - 1680 epochs total
Iteration 0, loss = 0.0035
Iteration 20, loss = 0.0050
Iteration 40, loss = 0.0020
Iteration 60, loss = 0.0039
Iteration 80, loss = 0.0050
--- Epoch 187 / 1506 - 1681 epochs total
Iteration 0, loss = 0.0046
Iteration 20, loss = 0.0156
Iteration 40, loss = 0.0023
Iteration 60, loss = 0.0027
Iteration 80, loss = 0.0041
--- Epoch 188 / 1506 - 1682 epochs total
Iteration 0, loss = 0.0062
Iteration 20, loss = 0.0029
Iteration 40, loss = 0.0039
Iteration 60, loss = 0.0018
Iteration 80, loss = 0.0044
--- Epoch 189 / 1506 - 1683 epochs total
Iteration 0, loss = 0.0036
Iteration 20, loss = 0.0033
Iteration 40, loss = 0.0022
Iteration 60, loss = 0.0049
Iteration 80, loss = 0.0127
--- Epoch 190 / 1506 - 1684 epochs total
Iteration 0, loss = 0.0060
Iteration 20, loss = 0.0037
Iteration 40, loss = 0.0040
Iteration 60, loss = 0.0033
Iteration 80, loss = 0.0111
--- Epoch 191 / 1506 - 1685 epochs total
Iteration 0, loss = 0.0088
Iteration 20, loss = 0.0033
Iteration 40, loss = 0.0021
Iteration 60, loss = 0.0049
Iteration 80, loss = 0.0037
--- Epoch 192 / 1506 - 1686 epochs total
Iteration 0, loss = 0.0044
Iteration 20, loss = 0.0075
Iteration 40, loss = 0.0030
Iteration 60, loss = 0.0138
Iteration 80, loss = 0.0090
--- Epoch 193 / 1506 - 1687 epochs total
Iteration 0, loss = 0.0042
Iteration 20, loss = 0.0018
Iteration 40, loss = 0.0131
Iteration 60, loss = 0.0026
Iteration 80, loss = 0.0026
--- Epoch 194 / 1506 - 1688 epochs total
Iteration 0, loss = 0.0055
Iteration 20, loss = 0.0027
Iteration 40, loss = 0.0031
Iteration 60, loss = 0.0041
Iteration 80, loss = 0.0024
--- Epoch 195 / 1506 - 1689 epochs total
Iteration 0, loss = 0.0024
Iteration 20, loss = 0.0032
Iteration 40, loss = 0.0036
Iteration 60, loss = 0.0030
Iteration 80, loss = 0.0037
--- Epoch 196 / 1506 - 1690 epochs total
Iteration 0, loss = 0.0024
Iteration 20, loss = 0.0042
Iteration 40, loss = 0.0038
Iteration 60, loss = 0.0029
Iteration 80, loss = 0.0026
--- Epoch 197 / 1506 - 1691 epochs total
Iteration 0, loss = 0.0284
Iteration 20, loss = 0.0129
Iteration 40, loss = 0.0031
Iteration 60, loss = 0.0029
Iteration 80, loss = 0.0036
--- Epoch 198 / 1506 - 1692 epochs total
Iteration 0, loss = 0.0018
Iteration 20, loss = 0.0035
Iteration 40, loss = 0.0036
Iteration 60, loss = 0.0082
Iteration 80, loss = 0.0036
--- Epoch 199 / 1506 - 1693 epochs total
Iteration 0, loss = 0.0027
Iteration 20, loss = 0.0028
Iteration 40, loss = 0.0036
Iteration 60, loss = 0.0027
Iteration 80, loss = 0.0020
--- Epoch 200 / 1506 - 1694 epochs total
Iteration 0, loss = 0.0039
Iteration 20, loss = 0.0051
Iteration 40, loss = 0.0018
Iteration 60, loss = 0.0033
Iteration 80, loss = 0.0033
--- Epoch 201 / 1506 - 1695 epochs total
Iteration 0, loss = 0.0048
Iteration 20, loss = 0.0156
Iteration 40, loss = 0.0064
Iteration 60, loss = 0.0034
Iteration 80, loss = 0.0040
--- Epoch 202 / 1506 - 1696 epochs total
Iteration 0, loss = 0.0073
Iteration 20, loss = 0.0044
Iteration 40, loss = 0.0032
Iteration 60, loss = 0.0015
Iteration 80, loss = 0.0040
--- Epoch 203 / 1506 - 1697 epochs total
Iteration 0, loss = 0.0031
Iteration 20, loss = 0.0129
Iteration 40, loss = 0.0022
Iteration 60, loss = 0.0043
Iteration 80, loss = 0.0019
--- Epoch 204 / 1506 - 1698 epochs total
Iteration 0, loss = 0.0062
Iteration 20, loss = 0.0037
Iteration 40, loss = 0.0016
Iteration 60, loss = 0.0035
Iteration 80, loss = 0.0049
--- Epoch 205 / 1506 - 1699 epochs total
Iteration 0, loss = 0.0031
Iteration 20, loss = 0.0022
Iteration 40, loss = 0.0022
Iteration 60, loss = 0.0039
Iteration 80, loss = 0.0042
--- Epoch 206 / 1506 - 1700 epochs total
Iteration 0, loss = 0.0042
Iteration 20, loss = 0.0044
Iteration 40, loss = 0.0063
Iteration 60, loss = 0.0026
Iteration 80, loss = 0.0053
--- Epoch 207 / 1506 - 1701 epochs total
Iteration 0, loss = 0.0284
Iteration 20, loss = 0.0143
Iteration 40, loss = 0.0043
Iteration 60, loss = 0.0049
Iteration 80, loss = 0.0042
--- Epoch 208 / 1506 - 1702 epochs total
Iteration 0, loss = 0.0051
Iteration 20, loss = 0.0042
Iteration 40, loss = 0.0032
Iteration 60, loss = 0.0018
Iteration 80, loss = 0.0042
--- Epoch 209 / 1506 - 1703 epochs total
Iteration 0, loss = 0.0027
Iteration 20, loss = 0.0058
Iteration 40, loss = 0.0066
Iteration 60, loss = 0.0035
Iteration 80, loss = 0.0034
--- Epoch 210 / 1506 - 1704 epochs total
Iteration 0, loss = 0.0042
Iteration 20, loss = 0.0024
Iteration 40, loss = 0.0019
Iteration 60, loss = 0.0031
Iteration 80, loss = 0.0027
--- Epoch 211 / 1506 - 1705 epochs total
Iteration 0, loss = 0.0027
Iteration 20, loss = 0.0066
Iteration 40, loss = 0.0068
Iteration 60, loss = 0.0042
Iteration 80, loss = 0.0044
--- Epoch 212 / 1506 - 1706 epochs total
Iteration 0, loss = 0.0046
Iteration 20, loss = 0.0028
Iteration 40, loss = 0.0063
Iteration 60, loss = 0.0061
Iteration 80, loss = 0.0124
--- Epoch 213 / 1506 - 1707 epochs total
Iteration 0, loss = 0.0016
Iteration 20, loss = 0.0030
Iteration 40, loss = 0.0033
Iteration 60, loss = 0.0146
Iteration 80, loss = 0.0032
--- Epoch 214 / 1506 - 1708 epochs total
Iteration 0, loss = 0.0065
Iteration 20, loss = 0.0081
Iteration 40, loss = 0.0059
Iteration 60, loss = 0.0015
Iteration 80, loss = 0.0098
--- Epoch 215 / 1506 - 1709 epochs total
Iteration 0, loss = 0.0015
Iteration 20, loss = 0.0044
Iteration 40, loss = 0.0023
Iteration 60, loss = 0.0081
Iteration 80, loss = 0.0025
--- Epoch 216 / 1506 - 1710 epochs total
Iteration 0, loss = 0.0030
Iteration 20, loss = 0.0041
Iteration 40, loss = 0.0034
Iteration 60, loss = 0.0030
Iteration 80, loss = 0.0032
--- Epoch 217 / 1506 - 1711 epochs total
Iteration 0, loss = 0.0060
Iteration 20, loss = 0.0033
Iteration 40, loss = 0.0016
Iteration 60, loss = 0.0031
Iteration 80, loss = 0.0032
--- Epoch 218 / 1506 - 1712 epochs total
Iteration 0, loss = 0.0049
Iteration 20, loss = 0.0043
Iteration 40, loss = 0.0034
Iteration 60, loss = 0.0041
Iteration 80, loss = 0.0025
--- Epoch 219 / 1506 - 1713 epochs total
Iteration 0, loss = 0.0044
Iteration 20, loss = 0.0036
Iteration 40, loss = 0.0028
Iteration 60, loss = 0.0076
Iteration 80, loss = 0.0010
--- Epoch 220 / 1506 - 1714 epochs total
Iteration 0, loss = 0.0023
Iteration 20, loss = 0.0047
Iteration 40, loss = 0.0061
Iteration 60, loss = 0.0041
Iteration 80, loss = 0.0031
--- Epoch 221 / 1506 - 1715 epochs total
Iteration 0, loss = 0.0055
Iteration 20, loss = 0.0015
Iteration 40, loss = 0.0106
Iteration 60, loss = 0.0052
Iteration 80, loss = 0.0047
--- Epoch 222 / 1506 - 1716 epochs total
Iteration 0, loss = 0.0033
Iteration 20, loss = 0.0022
Iteration 40, loss = 0.0035
Iteration 60, loss = 0.0050
Iteration 80, loss = 0.0042
--- Epoch 223 / 1506 - 1717 epochs total
Iteration 0, loss = 0.0125
Iteration 20, loss = 0.0021
Iteration 40, loss = 0.0041
Iteration 60, loss = 0.0079
Iteration 80, loss = 0.0060
--- Epoch 224 / 1506 - 1718 epochs total
Iteration 0, loss = 0.0039
Iteration 20, loss = 0.0038
Iteration 40, loss = 0.0063
Iteration 60, loss = 0.0021
Iteration 80, loss = 0.0053
--- Epoch 225 / 1506 - 1719 epochs total
Iteration 0, loss = 0.0062
Iteration 20, loss = 0.0030
Iteration 40, loss = 0.0019
Iteration 60, loss = 0.0017
Iteration 80, loss = 0.0044
--- Epoch 226 / 1506 - 1720 epochs total
Iteration 0, loss = 0.0081
Iteration 20, loss = 0.0028
Iteration 40, loss = 0.0026
Iteration 60, loss = 0.0039
Iteration 80, loss = 0.0076
--- Epoch 227 / 1506 - 1721 epochs total
Iteration 0, loss = 0.0036
Iteration 20, loss = 0.0031
Iteration 40, loss = 0.0053
Iteration 60, loss = 0.0049
Iteration 80, loss = 0.0068
--- Epoch 228 / 1506 - 1722 epochs total
Iteration 0, loss = 0.0040
Iteration 20, loss = 0.0037
Iteration 40, loss = 0.0043
Iteration 60, loss = 0.0056
Iteration 80, loss = 0.0032
--- Epoch 229 / 1506 - 1723 epochs total
Iteration 0, loss = 0.0021
Iteration 20, loss = 0.0043
Iteration 40, loss = 0.0029
Iteration 60, loss = 0.0091
Iteration 80, loss = 0.0176
--- Epoch 230 / 1506 - 1724 epochs total
Iteration 0, loss = 0.0036
Iteration 20, loss = 0.0046
Iteration 40, loss = 0.0027
Iteration 60, loss = 0.0033
Iteration 80, loss = 0.0030
--- Epoch 231 / 1506 - 1725 epochs total
Iteration 0, loss = 0.0053
Iteration 20, loss = 0.0023
Iteration 40, loss = 0.0028
Iteration 60, loss = 0.0049
Iteration 80, loss = 0.0020
--- Epoch 232 / 1506 - 1726 epochs total
Iteration 0, loss = 0.0042
Iteration 20, loss = 0.0017
Iteration 40, loss = 0.0043
Iteration 60, loss = 0.0045
Iteration 80, loss = 0.0061
--- Epoch 233 / 1506 - 1727 epochs total
Iteration 0, loss = 0.0033
Iteration 20, loss = 0.0036
Iteration 40, loss = 0.0024
Iteration 60, loss = 0.0034
Iteration 80, loss = 0.0037
--- Epoch 234 / 1506 - 1728 epochs total
Iteration 0, loss = 0.0041
Iteration 20, loss = 0.0031
Iteration 40, loss = 0.0035
Iteration 60, loss = 0.0073
Iteration 80, loss = 0.0021
--- Epoch 235 / 1506 - 1729 epochs total
Iteration 0, loss = 0.0038
Iteration 20, loss = 0.0034
Iteration 40, loss = 0.0032
Iteration 60, loss = 0.0038
Iteration 80, loss = 0.0091
--- Epoch 236 / 1506 - 1730 epochs total
Iteration 0, loss = 0.0025
Iteration 20, loss = 0.0095
Iteration 40, loss = 0.0023
Iteration 60, loss = 0.0145
Iteration 80, loss = 0.0064
--- Epoch 237 / 1506 - 1731 epochs total
Iteration 0, loss = 0.0059
Iteration 20, loss = 0.0039
Iteration 40, loss = 0.0022
Iteration 60, loss = 0.0028
Iteration 80, loss = 0.0107
--- Epoch 238 / 1506 - 1732 epochs total
Iteration 0, loss = 0.0059
Iteration 20, loss = 0.0032
Iteration 40, loss = 0.0017
Iteration 60, loss = 0.0071
Iteration 80, loss = 0.0098
--- Epoch 239 / 1506 - 1733 epochs total
Iteration 0, loss = 0.0044
Iteration 20, loss = 0.0057
Iteration 40, loss = 0.0051
Iteration 60, loss = 0.0034
Iteration 80, loss = 0.0023
--- Epoch 240 / 1506 - 1734 epochs total
Iteration 0, loss = 0.0014
Iteration 20, loss = 0.0046
Iteration 40, loss = 0.0023
Iteration 60, loss = 0.0034
Iteration 80, loss = 0.0024
--- Epoch 241 / 1506 - 1735 epochs total
Iteration 0, loss = 0.0027
Iteration 20, loss = 0.0030
Iteration 40, loss = 0.0036
Iteration 60, loss = 0.0096
Iteration 80, loss = 0.0050
--- Epoch 242 / 1506 - 1736 epochs total
Iteration 0, loss = 0.0050
Iteration 20, loss = 0.0028
Iteration 40, loss = 0.0062
Iteration 60, loss = 0.0032
Iteration 80, loss = 0.0086
--- Epoch 243 / 1506 - 1737 epochs total
Iteration 0, loss = 0.0027
Iteration 20, loss = 0.0027
Iteration 40, loss = 0.0030
Iteration 60, loss = 0.0077
Iteration 80, loss = 0.0021
--- Epoch 244 / 1506 - 1738 epochs total
Iteration 0, loss = 0.0046
Iteration 20, loss = 0.0039
Iteration 40, loss = 0.0176
Iteration 60, loss = 0.0052
Iteration 80, loss = 0.0099
--- Epoch 245 / 1506 - 1739 epochs total
Iteration 0, loss = 0.0029
Iteration 20, loss = 0.0036
Iteration 40, loss = 0.0074
Iteration 60, loss = 0.0059
Iteration 80, loss = 0.0029
--- Epoch 246 / 1506 - 1740 epochs total
Iteration 0, loss = 0.0153
Iteration 20, loss = 0.0047
Iteration 40, loss = 0.0026
Iteration 60, loss = 0.0038
Iteration 80, loss = 0.0024
--- Epoch 247 / 1506 - 1741 epochs total
Iteration 0, loss = 0.0037
Iteration 20, loss = 0.0021
Iteration 40, loss = 0.0029
Iteration 60, loss = 0.0027
Iteration 80, loss = 0.0042
--- Epoch 248 / 1506 - 1742 epochs total
Iteration 0, loss = 0.0030
Iteration 20, loss = 0.0047
Iteration 40, loss = 0.0017
Iteration 60, loss = 0.0046
Iteration 80, loss = 0.0028
--- Epoch 249 / 1506 - 1743 epochs total
Iteration 0, loss = 0.0054
Iteration 20, loss = 0.0033
Iteration 40, loss = 0.0030
Iteration 60, loss = 0.0032
Iteration 80, loss = 0.0138
--- Epoch 250 / 1506 - 1744 epochs total
Iteration 0, loss = 0.0043
Iteration 20, loss = 0.0035
Iteration 40, loss = 0.0041
Iteration 60, loss = 0.0030
Iteration 80, loss = 0.0028
--- Epoch 251 / 1506 - 1745 epochs total
Iteration 0, loss = 0.0083
Iteration 20, loss = 0.0013
Iteration 40, loss = 0.0045
Iteration 60, loss = 0.0025
Iteration 80, loss = 0.0079
--- Epoch 252 / 1506 - 1746 epochs total
Iteration 0, loss = 0.0048
Iteration 20, loss = 0.0046
Iteration 40, loss = 0.0103
Iteration 60, loss = 0.0102
Iteration 80, loss = 0.0032
--- Epoch 253 / 1506 - 1747 epochs total
Iteration 0, loss = 0.0018
Iteration 20, loss = 0.0055
Iteration 40, loss = 0.0117
Iteration 60, loss = 0.0027
Iteration 80, loss = 0.0043
--- Epoch 254 / 1506 - 1748 epochs total
Iteration 0, loss = 0.0032
Iteration 20, loss = 0.0028
Iteration 40, loss = 0.0054
Iteration 60, loss = 0.0022
Iteration 80, loss = 0.0039
--- Epoch 255 / 1506 - 1749 epochs total
Iteration 0, loss = 0.0054
Iteration 20, loss = 0.0047
Iteration 40, loss = 0.0027
Iteration 60, loss = 0.0047
Iteration 80, loss = 0.0066
--- Epoch 256 / 1506 - 1750 epochs total
Iteration 0, loss = 0.0028
Iteration 20, loss = 0.0055
Iteration 40, loss = 0.0058
Iteration 60, loss = 0.0035
Iteration 80, loss = 0.0021
--- Epoch 257 / 1506 - 1751 epochs total
Iteration 0, loss = 0.0030
Iteration 20, loss = 0.0033
Iteration 40, loss = 0.0045
Iteration 60, loss = 0.0028
Iteration 80, loss = 0.0036
--- Epoch 258 / 1506 - 1752 epochs total
Iteration 0, loss = 0.0071
Iteration 20, loss = 0.0015
Iteration 40, loss = 0.0059
Iteration 60, loss = 0.0178
Iteration 80, loss = 0.0057
--- Epoch 259 / 1506 - 1753 epochs total
Iteration 0, loss = 0.0044
Iteration 20, loss = 0.0027
Iteration 40, loss = 0.0042
Iteration 60, loss = 0.0135
Iteration 80, loss = 0.0057
--- Epoch 260 / 1506 - 1754 epochs total
Iteration 0, loss = 0.0029
Iteration 20, loss = 0.0037
Iteration 40, loss = 0.0051
Iteration 60, loss = 0.0041
Iteration 80, loss = 0.0054
--- Epoch 261 / 1506 - 1755 epochs total
Iteration 0, loss = 0.0046
Iteration 20, loss = 0.0193
Iteration 40, loss = 0.0038
Iteration 60, loss = 0.0075
Iteration 80, loss = 0.0069
--- Epoch 262 / 1506 - 1756 epochs total
Iteration 0, loss = 0.0057
Iteration 20, loss = 0.0017
Iteration 40, loss = 0.0022
Iteration 60, loss = 0.0052
Iteration 80, loss = 0.0061
--- Epoch 263 / 1506 - 1757 epochs total
Iteration 0, loss = 0.0055
Iteration 20, loss = 0.0043
Iteration 40, loss = 0.0052
Iteration 60, loss = 0.0055
Iteration 80, loss = 0.0018
--- Epoch 264 / 1506 - 1758 epochs total
Iteration 0, loss = 0.0127
Iteration 20, loss = 0.0040
Iteration 40, loss = 0.0028
Iteration 60, loss = 0.0065
Iteration 80, loss = 0.0040
--- Epoch 265 / 1506 - 1759 epochs total
Iteration 0, loss = 0.0095
Iteration 20, loss = 0.0022
Iteration 40, loss = 0.0061
Iteration 60, loss = 0.0037
Iteration 80, loss = 0.0024
--- Epoch 266 / 1506 - 1760 epochs total
Iteration 0, loss = 0.0058
Iteration 20, loss = 0.0029
Iteration 40, loss = 0.0052
Iteration 60, loss = 0.0106
Iteration 80, loss = 0.0050
--- Epoch 267 / 1506 - 1761 epochs total
Iteration 0, loss = 0.0036
Iteration 20, loss = 0.0027
Iteration 40, loss = 0.0042
Iteration 60, loss = 0.0141
Iteration 80, loss = 0.0049
--- Epoch 268 / 1506 - 1762 epochs total
Iteration 0, loss = 0.0060
Iteration 20, loss = 0.0040
Iteration 40, loss = 0.0037
Iteration 60, loss = 0.0073
Iteration 80, loss = 0.0023
--- Epoch 269 / 1506 - 1763 epochs total
Iteration 0, loss = 0.0058
Iteration 20, loss = 0.0067
Iteration 40, loss = 0.0020
Iteration 60, loss = 0.0042
Iteration 80, loss = 0.0035
--- Epoch 270 / 1506 - 1764 epochs total
Iteration 0, loss = 0.0148
Iteration 20, loss = 0.0180
Iteration 40, loss = 0.0021
Iteration 60, loss = 0.0031
Iteration 80, loss = 0.0019
--- Epoch 271 / 1506 - 1765 epochs total
Iteration 0, loss = 0.0052
Iteration 20, loss = 0.0082
Iteration 40, loss = 0.0039
Iteration 60, loss = 0.0021
Iteration 80, loss = 0.0039
--- Epoch 272 / 1506 - 1766 epochs total
Iteration 0, loss = 0.0061
Iteration 20, loss = 0.0067
Iteration 40, loss = 0.0072
Iteration 60, loss = 0.0092
Iteration 80, loss = 0.0031
--- Epoch 273 / 1506 - 1767 epochs total
Iteration 0, loss = 0.0035
Iteration 20, loss = 0.0056
Iteration 40, loss = 0.0025
Iteration 60, loss = 0.0068
Iteration 80, loss = 0.0046
--- Epoch 274 / 1506 - 1768 epochs total
Iteration 0, loss = 0.0088
Iteration 20, loss = 0.0035
Iteration 40, loss = 0.0020
Iteration 60, loss = 0.0191
Iteration 80, loss = 0.0017
--- Epoch 275 / 1506 - 1769 epochs total
Iteration 0, loss = 0.0022
Iteration 20, loss = 0.0018
Iteration 40, loss = 0.0031
Iteration 60, loss = 0.0029
Iteration 80, loss = 0.0034
--- Epoch 276 / 1506 - 1770 epochs total
Iteration 0, loss = 0.0046
Iteration 20, loss = 0.0051
Iteration 40, loss = 0.0040
Iteration 60, loss = 0.0049
Iteration 80, loss = 0.0037
--- Epoch 277 / 1506 - 1771 epochs total
Iteration 0, loss = 0.0025
Iteration 20, loss = 0.0254
Iteration 40, loss = 0.0026
Iteration 60, loss = 0.0040
Iteration 80, loss = 0.0023
--- Epoch 278 / 1506 - 1772 epochs total
Iteration 0, loss = 0.0099
Iteration 20, loss = 0.0022
Iteration 40, loss = 0.0230
Iteration 60, loss = 0.0041
Iteration 80, loss = 0.0057
--- Epoch 279 / 1506 - 1773 epochs total
Iteration 0, loss = 0.0035
Iteration 20, loss = 0.0046
Iteration 40, loss = 0.0026
Iteration 60, loss = 0.0129
Iteration 80, loss = 0.0034
--- Epoch 280 / 1506 - 1774 epochs total
Iteration 0, loss = 0.0085
Iteration 20, loss = 0.0137
Iteration 40, loss = 0.0036
Iteration 60, loss = 0.0031
Iteration 80, loss = 0.0041
--- Epoch 281 / 1506 - 1775 epochs total
Iteration 0, loss = 0.0009
Iteration 20, loss = 0.0020
Iteration 40, loss = 0.0029
Iteration 60, loss = 0.0164
Iteration 80, loss = 0.0050
--- Epoch 282 / 1506 - 1776 epochs total
Iteration 0, loss = 0.0029
Iteration 20, loss = 0.0073
Iteration 40, loss = 0.0051
Iteration 60, loss = 0.0061
Iteration 80, loss = 0.0028
--- Epoch 283 / 1506 - 1777 epochs total
Iteration 0, loss = 0.0074
Iteration 20, loss = 0.0051
Iteration 40, loss = 0.0060
Iteration 60, loss = 0.0048
Iteration 80, loss = 0.0054
--- Epoch 284 / 1506 - 1778 epochs total
Iteration 0, loss = 0.0009
Iteration 20, loss = 0.0120
Iteration 40, loss = 0.0043
Iteration 60, loss = 0.0074
Iteration 80, loss = 0.0040
--- Epoch 285 / 1506 - 1779 epochs total
Iteration 0, loss = 0.0014
Iteration 20, loss = 0.0338
Iteration 40, loss = 0.0028
Iteration 60, loss = 0.0035
Iteration 80, loss = 0.0044
--- Epoch 286 / 1506 - 1780 epochs total
Iteration 0, loss = 0.0023
Iteration 20, loss = 0.0024
Iteration 40, loss = 0.0031
Iteration 60, loss = 0.0032
Iteration 80, loss = 0.0011
--- Epoch 287 / 1506 - 1781 epochs total
Iteration 0, loss = 0.0028
Iteration 20, loss = 0.0043
Iteration 40, loss = 0.0119
Iteration 60, loss = 0.0032
Iteration 80, loss = 0.0035
--- Epoch 288 / 1506 - 1782 epochs total
Iteration 0, loss = 0.0018
Iteration 20, loss = 0.0029
Iteration 40, loss = 0.0100
Iteration 60, loss = 0.0031
Iteration 80, loss = 0.0059
--- Epoch 289 / 1506 - 1783 epochs total
Iteration 0, loss = 0.0010
Iteration 20, loss = 0.0119
Iteration 40, loss = 0.0014
Iteration 60, loss = 0.0028
Iteration 80, loss = 0.0072
--- Epoch 290 / 1506 - 1784 epochs total
Iteration 0, loss = 0.0045
Iteration 20, loss = 0.0021
Iteration 40, loss = 0.0035
Iteration 60, loss = 0.0032
Iteration 80, loss = 0.0089
--- Epoch 291 / 1506 - 1785 epochs total
Iteration 0, loss = 0.0040
Iteration 20, loss = 0.0194
Iteration 40, loss = 0.0074
Iteration 60, loss = 0.0026
Iteration 80, loss = 0.0045
--- Epoch 292 / 1506 - 1786 epochs total
Iteration 0, loss = 0.0027
Iteration 20, loss = 0.0046
Iteration 40, loss = 0.0042
Iteration 60, loss = 0.0029
Iteration 80, loss = 0.0179
--- Epoch 293 / 1506 - 1787 epochs total
Iteration 0, loss = 0.0042
Iteration 20, loss = 0.0089
Iteration 40, loss = 0.0122
Iteration 60, loss = 0.0019
Iteration 80, loss = 0.0048
--- Epoch 294 / 1506 - 1788 epochs total
Iteration 0, loss = 0.0022
Iteration 20, loss = 0.0025
Iteration 40, loss = 0.0101
Iteration 60, loss = 0.0033
Iteration 80, loss = 0.0040
--- Epoch 295 / 1506 - 1789 epochs total
Iteration 0, loss = 0.0021
Iteration 20, loss = 0.0020
Iteration 40, loss = 0.0028
Iteration 60, loss = 0.0022
Iteration 80, loss = 0.0031
--- Epoch 296 / 1506 - 1790 epochs total
Iteration 0, loss = 0.0030
Iteration 20, loss = 0.0028
Iteration 40, loss = 0.0078
Iteration 60, loss = 0.0033
Iteration 80, loss = 0.0024
--- Epoch 297 / 1506 - 1791 epochs total
Iteration 0, loss = 0.0045
Iteration 20, loss = 0.0040
Iteration 40, loss = 0.0035
Iteration 60, loss = 0.0030
Iteration 80, loss = 0.0023
--- Epoch 298 / 1506 - 1792 epochs total
Iteration 0, loss = 0.0034
Iteration 20, loss = 0.0051
Iteration 40, loss = 0.0024
Iteration 60, loss = 0.0023
Iteration 80, loss = 0.0053
--- Epoch 299 / 1506 - 1793 epochs total
Iteration 0, loss = 0.0035
Iteration 20, loss = 0.0031
Iteration 40, loss = 0.0038
Iteration 60, loss = 0.0015
Iteration 80, loss = 0.0040
--- Epoch 300 / 1506 - 1794 epochs total
Iteration 0, loss = 0.0025
Iteration 20, loss = 0.0052
Iteration 40, loss = 0.0040
Iteration 60, loss = 0.0048
Iteration 80, loss = 0.0028
--- Epoch 301 / 1506 - 1795 epochs total
Iteration 0, loss = 0.0050
Iteration 20, loss = 0.0024
Iteration 40, loss = 0.0023
Iteration 60, loss = 0.0017
Iteration 80, loss = 0.0047
--- Epoch 302 / 1506 - 1796 epochs total
Iteration 0, loss = 0.0055
Iteration 20, loss = 0.0053
Iteration 40, loss = 0.0062
Iteration 60, loss = 0.0073
Iteration 80, loss = 0.0055
--- Epoch 303 / 1506 - 1797 epochs total
Iteration 0, loss = 0.0029
Iteration 20, loss = 0.0055
Iteration 40, loss = 0.0072
Iteration 60, loss = 0.0020
Iteration 80, loss = 0.0022
--- Epoch 304 / 1506 - 1798 epochs total
Iteration 0, loss = 0.0083
Iteration 20, loss = 0.0030
Iteration 40, loss = 0.0020
Iteration 60, loss = 0.0040
Iteration 80, loss = 0.0034
--- Epoch 305 / 1506 - 1799 epochs total
Iteration 0, loss = 0.0083
Iteration 20, loss = 0.0032
Iteration 40, loss = 0.0022
Iteration 60, loss = 0.0057
Iteration 80, loss = 0.0032
--- Epoch 306 / 1506 - 1800 epochs total
Iteration 0, loss = 0.0029
Iteration 20, loss = 0.0020
Iteration 40, loss = 0.0055
Iteration 60, loss = 0.0027
Iteration 80, loss = 0.0020
--- Epoch 307 / 1506 - 1801 epochs total
Iteration 0, loss = 0.0032
Iteration 20, loss = 0.0027
Iteration 40, loss = 0.0050
Iteration 60, loss = 0.0031
Iteration 80, loss = 0.0037
--- Epoch 308 / 1506 - 1802 epochs total
Iteration 0, loss = 0.0033
Iteration 20, loss = 0.0037
Iteration 40, loss = 0.0156
Iteration 60, loss = 0.0024
Iteration 80, loss = 0.0031
--- Epoch 309 / 1506 - 1803 epochs total
Iteration 0, loss = 0.0032
Iteration 20, loss = 0.0053
Iteration 40, loss = 0.0035
Iteration 60, loss = 0.0019
Iteration 80, loss = 0.0036
--- Epoch 310 / 1506 - 1804 epochs total
Iteration 0, loss = 0.0048
Iteration 20, loss = 0.0027
Iteration 40, loss = 0.0040
Iteration 60, loss = 0.0075
Iteration 80, loss = 0.0028
--- Epoch 311 / 1506 - 1805 epochs total
Iteration 0, loss = 0.0027
Iteration 20, loss = 0.0018
Iteration 40, loss = 0.0041
Iteration 60, loss = 0.0042
Iteration 80, loss = 0.0017
--- Epoch 312 / 1506 - 1806 epochs total
Iteration 0, loss = 0.0143
Iteration 20, loss = 0.0041
Iteration 40, loss = 0.0109
Iteration 60, loss = 0.0035
Iteration 80, loss = 0.0024
--- Epoch 313 / 1506 - 1807 epochs total
Iteration 0, loss = 0.0039
Iteration 20, loss = 0.0052
Iteration 40, loss = 0.0060
Iteration 60, loss = 0.0085
Iteration 80, loss = 0.0029
--- Epoch 314 / 1506 - 1808 epochs total
Iteration 0, loss = 0.0035
Iteration 20, loss = 0.0029
Iteration 40, loss = 0.0082
Iteration 60, loss = 0.0033
Iteration 80, loss = 0.0042
--- Epoch 315 / 1506 - 1809 epochs total
Iteration 0, loss = 0.0086
Iteration 20, loss = 0.0020
Iteration 40, loss = 0.0025
Iteration 60, loss = 0.0064
Iteration 80, loss = 0.0043
--- Epoch 316 / 1506 - 1810 epochs total
Iteration 0, loss = 0.0043
Iteration 20, loss = 0.0032
Iteration 40, loss = 0.0072
Iteration 60, loss = 0.0020
Iteration 80, loss = 0.0044
--- Epoch 317 / 1506 - 1811 epochs total
Iteration 0, loss = 0.0040
Iteration 20, loss = 0.0029
Iteration 40, loss = 0.0088
Iteration 60, loss = 0.0032
Iteration 80, loss = 0.0038
--- Epoch 318 / 1506 - 1812 epochs total
Iteration 0, loss = 0.0082
Iteration 20, loss = 0.0054
Iteration 40, loss = 0.0044
Iteration 60, loss = 0.0027
Iteration 80, loss = 0.0040
--- Epoch 319 / 1506 - 1813 epochs total
Iteration 0, loss = 0.0086
Iteration 20, loss = 0.0078
Iteration 40, loss = 0.0043
Iteration 60, loss = 0.0034
Iteration 80, loss = 0.0052
--- Epoch 320 / 1506 - 1814 epochs total
Iteration 0, loss = 0.0066
Iteration 20, loss = 0.0020
Iteration 40, loss = 0.0023
Iteration 60, loss = 0.0025
Iteration 80, loss = 0.0036
--- Epoch 321 / 1506 - 1815 epochs total
Iteration 0, loss = 0.0071
Iteration 20, loss = 0.0029
Iteration 40, loss = 0.0013
Iteration 60, loss = 0.0253
Iteration 80, loss = 0.0082
--- Epoch 322 / 1506 - 1816 epochs total
Iteration 0, loss = 0.0046
Iteration 20, loss = 0.0107
Iteration 40, loss = 0.0017
Iteration 60, loss = 0.0028
Iteration 80, loss = 0.0068
--- Epoch 323 / 1506 - 1817 epochs total
Iteration 0, loss = 0.0048
Iteration 20, loss = 0.0031
Iteration 40, loss = 0.0111
Iteration 60, loss = 0.0024
Iteration 80, loss = 0.0020
--- Epoch 324 / 1506 - 1818 epochs total
Iteration 0, loss = 0.0031
Iteration 20, loss = 0.0018
Iteration 40, loss = 0.0033
Iteration 60, loss = 0.0033
Iteration 80, loss = 0.0014
--- Epoch 325 / 1506 - 1819 epochs total
Iteration 0, loss = 0.0079
Iteration 20, loss = 0.0031
Iteration 40, loss = 0.0033
Iteration 60, loss = 0.0061
Iteration 80, loss = 0.0032
--- Epoch 326 / 1506 - 1820 epochs total
Iteration 0, loss = 0.0055
Iteration 20, loss = 0.0040
Iteration 40, loss = 0.0021
Iteration 60, loss = 0.0018
Iteration 80, loss = 0.0079
--- Epoch 327 / 1506 - 1821 epochs total
Iteration 0, loss = 0.0029
Iteration 20, loss = 0.0054
Iteration 40, loss = 0.0029
Iteration 60, loss = 0.0039
Iteration 80, loss = 0.0024
--- Epoch 328 / 1506 - 1822 epochs total
Iteration 0, loss = 0.0014
Iteration 20, loss = 0.0022
Iteration 40, loss = 0.0060
Iteration 60, loss = 0.0080
Iteration 80, loss = 0.0043
--- Epoch 329 / 1506 - 1823 epochs total
Iteration 0, loss = 0.0284
Iteration 20, loss = 0.0059
Iteration 40, loss = 0.0119
Iteration 60, loss = 0.0059
Iteration 80, loss = 0.0024
--- Epoch 330 / 1506 - 1824 epochs total
Iteration 0, loss = 0.0022
Iteration 20, loss = 0.0110
Iteration 40, loss = 0.0059
Iteration 60, loss = 0.0052
Iteration 80, loss = 0.0020
--- Epoch 331 / 1506 - 1825 epochs total
Iteration 0, loss = 0.0028
Iteration 20, loss = 0.0026
Iteration 40, loss = 0.0027
Iteration 60, loss = 0.0027
Iteration 80, loss = 0.0052
--- Epoch 332 / 1506 - 1826 epochs total
Iteration 0, loss = 0.0029
Iteration 20, loss = 0.0038
Iteration 40, loss = 0.0029
Iteration 60, loss = 0.0032
Iteration 80, loss = 0.0021
--- Epoch 333 / 1506 - 1827 epochs total
Iteration 0, loss = 0.0039
Iteration 20, loss = 0.0023
Iteration 40, loss = 0.0032
Iteration 60, loss = 0.0057
Iteration 80, loss = 0.0027
--- Epoch 334 / 1506 - 1828 epochs total
Iteration 0, loss = 0.0031
Iteration 20, loss = 0.0055
Iteration 40, loss = 0.0049
Iteration 60, loss = 0.0067
Iteration 80, loss = 0.0032
--- Epoch 335 / 1506 - 1829 epochs total
Iteration 0, loss = 0.0035
Iteration 20, loss = 0.0064
Iteration 40, loss = 0.0040
Iteration 60, loss = 0.0031
Iteration 80, loss = 0.0016
--- Epoch 336 / 1506 - 1830 epochs total
Iteration 0, loss = 0.0027
Iteration 20, loss = 0.0032
Iteration 40, loss = 0.0030
Iteration 60, loss = 0.0065
Iteration 80, loss = 0.0044
--- Epoch 337 / 1506 - 1831 epochs total
Iteration 0, loss = 0.0044
Iteration 20, loss = 0.0048
Iteration 40, loss = 0.0034
Iteration 60, loss = 0.0030
Iteration 80, loss = 0.0026
--- Epoch 338 / 1506 - 1832 epochs total
Iteration 0, loss = 0.0027
Iteration 20, loss = 0.0092
Iteration 40, loss = 0.0029
Iteration 60, loss = 0.0032
Iteration 80, loss = 0.0035
--- Epoch 339 / 1506 - 1833 epochs total
Iteration 0, loss = 0.0039
Iteration 20, loss = 0.0021
Iteration 40, loss = 0.0052
Iteration 60, loss = 0.0046
Iteration 80, loss = 0.0041
--- Epoch 340 / 1506 - 1834 epochs total
Iteration 0, loss = 0.0049
Iteration 20, loss = 0.0046
Iteration 40, loss = 0.0034
Iteration 60, loss = 0.0069
Iteration 80, loss = 0.0022
--- Epoch 341 / 1506 - 1835 epochs total
Iteration 0, loss = 0.0018
Iteration 20, loss = 0.0031
Iteration 40, loss = 0.0046
Iteration 60, loss = 0.0048
Iteration 80, loss = 0.0041
--- Epoch 342 / 1506 - 1836 epochs total
Iteration 0, loss = 0.0024
Iteration 20, loss = 0.0035
Iteration 40, loss = 0.0037
Iteration 60, loss = 0.0033
Iteration 80, loss = 0.0029
--- Epoch 343 / 1506 - 1837 epochs total
Iteration 0, loss = 0.0042
Iteration 20, loss = 0.0052
Iteration 40, loss = 0.0070
Iteration 60, loss = 0.0054
Iteration 80, loss = 0.0063
--- Epoch 344 / 1506 - 1838 epochs total
Iteration 0, loss = 0.0108
Iteration 20, loss = 0.0045
Iteration 40, loss = 0.0033
Iteration 60, loss = 0.0040
Iteration 80, loss = 0.0033
--- Epoch 345 / 1506 - 1839 epochs total
Iteration 0, loss = 0.0059
Iteration 20, loss = 0.0039
Iteration 40, loss = 0.0284
Iteration 60, loss = 0.0133
Iteration 80, loss = 0.0060
--- Epoch 346 / 1506 - 1840 epochs total
Iteration 0, loss = 0.0034
Iteration 20, loss = 0.0038
Iteration 40, loss = 0.0020
Iteration 60, loss = 0.0035
Iteration 80, loss = 0.0061
--- Epoch 347 / 1506 - 1841 epochs total
Iteration 0, loss = 0.0057
Iteration 20, loss = 0.0112
Iteration 40, loss = 0.0044
Iteration 60, loss = 0.0032
Iteration 80, loss = 0.0036
--- Epoch 348 / 1506 - 1842 epochs total
Iteration 0, loss = 0.0023
Iteration 20, loss = 0.0141
Iteration 40, loss = 0.0032
Iteration 60, loss = 0.0022
Iteration 80, loss = 0.0114
--- Epoch 349 / 1506 - 1843 epochs total
Iteration 0, loss = 0.0030
Iteration 20, loss = 0.0031
Iteration 40, loss = 0.0020
Iteration 60, loss = 0.0035
Iteration 80, loss = 0.0036
--- Epoch 350 / 1506 - 1844 epochs total
Iteration 0, loss = 0.0021
Iteration 20, loss = 0.0040
Iteration 40, loss = 0.0140
Iteration 60, loss = 0.0071
Iteration 80, loss = 0.0311
--- Epoch 351 / 1506 - 1845 epochs total
Iteration 0, loss = 0.0044
Iteration 20, loss = 0.0042
Iteration 40, loss = 0.0028
Iteration 60, loss = 0.0041
Iteration 80, loss = 0.0014
--- Epoch 352 / 1506 - 1846 epochs total
Iteration 0, loss = 0.0029
Iteration 20, loss = 0.0020
Iteration 40, loss = 0.0043
Iteration 60, loss = 0.0027
Iteration 80, loss = 0.0108
--- Epoch 353 / 1506 - 1847 epochs total
Iteration 0, loss = 0.0028
Iteration 20, loss = 0.0040
Iteration 40, loss = 0.0027
Iteration 60, loss = 0.0081
Iteration 80, loss = 0.0120
--- Epoch 354 / 1506 - 1848 epochs total
Iteration 0, loss = 0.0059
Iteration 20, loss = 0.0055
Iteration 40, loss = 0.0019
Iteration 60, loss = 0.0045
Iteration 80, loss = 0.0060
--- Epoch 355 / 1506 - 1849 epochs total
Iteration 0, loss = 0.0038
Iteration 20, loss = 0.0048
Iteration 40, loss = 0.0030
Iteration 60, loss = 0.0029
Iteration 80, loss = 0.0088
--- Epoch 356 / 1506 - 1850 epochs total
Iteration 0, loss = 0.0067
Iteration 20, loss = 0.0030
Iteration 40, loss = 0.0033
Iteration 60, loss = 0.0152
Iteration 80, loss = 0.0029
--- Epoch 357 / 1506 - 1851 epochs total
Iteration 0, loss = 0.0019
Iteration 20, loss = 0.0016
Iteration 40, loss = 0.0039
Iteration 60, loss = 0.0014
Iteration 80, loss = 0.0039
--- Epoch 358 / 1506 - 1852 epochs total
Iteration 0, loss = 0.0281
Iteration 20, loss = 0.0032
Iteration 40, loss = 0.0032
Iteration 60, loss = 0.0065
Iteration 80, loss = 0.0024
--- Epoch 359 / 1506 - 1853 epochs total
Iteration 0, loss = 0.0042
Iteration 20, loss = 0.0020
Iteration 40, loss = 0.0073
Iteration 60, loss = 0.0047
Iteration 80, loss = 0.0099
--- Epoch 360 / 1506 - 1854 epochs total
Iteration 0, loss = 0.0031
Iteration 20, loss = 0.0017
Iteration 40, loss = 0.0039
Iteration 60, loss = 0.0045
Iteration 80, loss = 0.0018
--- Epoch 361 / 1506 - 1855 epochs total
Iteration 0, loss = 0.0030
Iteration 20, loss = 0.0026
Iteration 40, loss = 0.0054
Iteration 60, loss = 0.0020
Iteration 80, loss = 0.0018
--- Epoch 362 / 1506 - 1856 epochs total
Iteration 0, loss = 0.0026
Iteration 20, loss = 0.0052
Iteration 40, loss = 0.0069
Iteration 60, loss = 0.0045
Iteration 80, loss = 0.0027
--- Epoch 363 / 1506 - 1857 epochs total
Iteration 0, loss = 0.0072
Iteration 20, loss = 0.0032
Iteration 40, loss = 0.0030
Iteration 60, loss = 0.0037
Iteration 80, loss = 0.0032
--- Epoch 364 / 1506 - 1858 epochs total
Iteration 0, loss = 0.0035
Iteration 20, loss = 0.0039
Iteration 40, loss = 0.0069
Iteration 60, loss = 0.0068
Iteration 80, loss = 0.0037
--- Epoch 365 / 1506 - 1859 epochs total
Iteration 0, loss = 0.0048
Iteration 20, loss = 0.0070
Iteration 40, loss = 0.0044
Iteration 60, loss = 0.0042
Iteration 80, loss = 0.0051
--- Epoch 366 / 1506 - 1860 epochs total
Iteration 0, loss = 0.0041
Iteration 20, loss = 0.0028
Iteration 40, loss = 0.0086
Iteration 60, loss = 0.0048
Iteration 80, loss = 0.0080
--- Epoch 367 / 1506 - 1861 epochs total
Iteration 0, loss = 0.0058
Iteration 20, loss = 0.0030
Iteration 40, loss = 0.0063
Iteration 60, loss = 0.0041
Iteration 80, loss = 0.0046
--- Epoch 368 / 1506 - 1862 epochs total
Iteration 0, loss = 0.0040
Iteration 20, loss = 0.0025
Iteration 40, loss = 0.0020
Iteration 60, loss = 0.0038
Iteration 80, loss = 0.0042
--- Epoch 369 / 1506 - 1863 epochs total
Iteration 0, loss = 0.0045
Iteration 20, loss = 0.0152
Iteration 40, loss = 0.0046
Iteration 60, loss = 0.0057
Iteration 80, loss = 0.0025
--- Epoch 370 / 1506 - 1864 epochs total
Iteration 0, loss = 0.0040
Iteration 20, loss = 0.0071
Iteration 40, loss = 0.0108
Iteration 60, loss = 0.0048
Iteration 80, loss = 0.0036
--- Epoch 371 / 1506 - 1865 epochs total
Iteration 0, loss = 0.0025
Iteration 20, loss = 0.0039
Iteration 40, loss = 0.0053
Iteration 60, loss = 0.0024
Iteration 80, loss = 0.0072
--- Epoch 372 / 1506 - 1866 epochs total
Iteration 0, loss = 0.0029
Iteration 20, loss = 0.0025
Iteration 40, loss = 0.0071
Iteration 60, loss = 0.0061
Iteration 80, loss = 0.0013
--- Epoch 373 / 1506 - 1867 epochs total
Iteration 0, loss = 0.0021
Iteration 20, loss = 0.0020
Iteration 40, loss = 0.0081
Iteration 60, loss = 0.0036
Iteration 80, loss = 0.0015
--- Epoch 374 / 1506 - 1868 epochs total
Iteration 0, loss = 0.0026
Iteration 20, loss = 0.0037
Iteration 40, loss = 0.0064
Iteration 60, loss = 0.0025
Iteration 80, loss = 0.0066
--- Epoch 375 / 1506 - 1869 epochs total
Iteration 0, loss = 0.0085
Iteration 20, loss = 0.0023
Iteration 40, loss = 0.0034
Iteration 60, loss = 0.0025
Iteration 80, loss = 0.0024
--- Epoch 376 / 1506 - 1870 epochs total
Iteration 0, loss = 0.0029
Iteration 20, loss = 0.0062
Iteration 40, loss = 0.0230
Iteration 60, loss = 0.0043
Iteration 80, loss = 0.0042
--- Epoch 377 / 1506 - 1871 epochs total
Iteration 0, loss = 0.0036
Iteration 20, loss = 0.0023
Iteration 40, loss = 0.0010
Iteration 60, loss = 0.0023
Iteration 80, loss = 0.0021
--- Epoch 378 / 1506 - 1872 epochs total
Iteration 0, loss = 0.0035
Iteration 20, loss = 0.0027
Iteration 40, loss = 0.0010
Iteration 60, loss = 0.0023
Iteration 80, loss = 0.0035
--- Epoch 379 / 1506 - 1873 epochs total
Iteration 0, loss = 0.0078
Iteration 20, loss = 0.0051
Iteration 40, loss = 0.0043
Iteration 60, loss = 0.0057
Iteration 80, loss = 0.0092
--- Epoch 380 / 1506 - 1874 epochs total
Iteration 0, loss = 0.0051
Iteration 20, loss = 0.0060
Iteration 40, loss = 0.0045
Iteration 60, loss = 0.0023
Iteration 80, loss = 0.0104
--- Epoch 381 / 1506 - 1875 epochs total
Iteration 0, loss = 0.0041
Iteration 20, loss = 0.0023
Iteration 40, loss = 0.0122
Iteration 60, loss = 0.0022
Iteration 80, loss = 0.0106
--- Epoch 382 / 1506 - 1876 epochs total
Iteration 0, loss = 0.0062
Iteration 20, loss = 0.0119
Iteration 40, loss = 0.0026
Iteration 60, loss = 0.0057
Iteration 80, loss = 0.0026
--- Epoch 383 / 1506 - 1877 epochs total
Iteration 0, loss = 0.0028
Iteration 20, loss = 0.0043
Iteration 40, loss = 0.0024
Iteration 60, loss = 0.0054
Iteration 80, loss = 0.0112
--- Epoch 384 / 1506 - 1878 epochs total
Iteration 0, loss = 0.0070
Iteration 20, loss = 0.0017
Iteration 40, loss = 0.0028
Iteration 60, loss = 0.0129
Iteration 80, loss = 0.0048
--- Epoch 385 / 1506 - 1879 epochs total
Iteration 0, loss = 0.0023
Iteration 20, loss = 0.0030
Iteration 40, loss = 0.0033
Iteration 60, loss = 0.0028
Iteration 80, loss = 0.0028
--- Epoch 386 / 1506 - 1880 epochs total
Iteration 0, loss = 0.0042
Iteration 20, loss = 0.0094
Iteration 40, loss = 0.0033
Iteration 60, loss = 0.0048
Iteration 80, loss = 0.0088
--- Epoch 387 / 1506 - 1881 epochs total
Iteration 0, loss = 0.0030
Iteration 20, loss = 0.0084
Iteration 40, loss = 0.0027
Iteration 60, loss = 0.0029
Iteration 80, loss = 0.0054
--- Epoch 388 / 1506 - 1882 epochs total
Iteration 0, loss = 0.0042
Iteration 20, loss = 0.0024
Iteration 40, loss = 0.0019
Iteration 60, loss = 0.0046
Iteration 80, loss = 0.0050
--- Epoch 389 / 1506 - 1883 epochs total
Iteration 0, loss = 0.0024
Iteration 20, loss = 0.0028
Iteration 40, loss = 0.0035
Iteration 60, loss = 0.0032
Iteration 80, loss = 0.0039
--- Epoch 390 / 1506 - 1884 epochs total
Iteration 0, loss = 0.0039
Iteration 20, loss = 0.0098
Iteration 40, loss = 0.0184
Iteration 60, loss = 0.0021
Iteration 80, loss = 0.0033
--- Epoch 391 / 1506 - 1885 epochs total
Iteration 0, loss = 0.0022
Iteration 20, loss = 0.0035
Iteration 40, loss = 0.0050
Iteration 60, loss = 0.0059
Iteration 80, loss = 0.0049
--- Epoch 392 / 1506 - 1886 epochs total
Iteration 0, loss = 0.0027
Iteration 20, loss = 0.0018
Iteration 40, loss = 0.0154
Iteration 60, loss = 0.0050
Iteration 80, loss = 0.0038
--- Epoch 393 / 1506 - 1887 epochs total
Iteration 0, loss = 0.0035
Iteration 20, loss = 0.0043
Iteration 40, loss = 0.0032
Iteration 60, loss = 0.0230
Iteration 80, loss = 0.0020
--- Epoch 394 / 1506 - 1888 epochs total
Iteration 0, loss = 0.0036
Iteration 20, loss = 0.0088
Iteration 40, loss = 0.0060
Iteration 60, loss = 0.0039
Iteration 80, loss = 0.0017
--- Epoch 395 / 1506 - 1889 epochs total
Iteration 0, loss = 0.0051
Iteration 20, loss = 0.0032
Iteration 40, loss = 0.0037
Iteration 60, loss = 0.0038
Iteration 80, loss = 0.0021
--- Epoch 396 / 1506 - 1890 epochs total
Iteration 0, loss = 0.0024
Iteration 20, loss = 0.0059
Iteration 40, loss = 0.0091
Iteration 60, loss = 0.0041
Iteration 80, loss = 0.0013
--- Epoch 397 / 1506 - 1891 epochs total
Iteration 0, loss = 0.0029
Iteration 20, loss = 0.0037
Iteration 40, loss = 0.0040
Iteration 60, loss = 0.0026
Iteration 80, loss = 0.0051
--- Epoch 398 / 1506 - 1892 epochs total
Iteration 0, loss = 0.0032
Iteration 20, loss = 0.0042
Iteration 40, loss = 0.0019
Iteration 60, loss = 0.0049
Iteration 80, loss = 0.0034
--- Epoch 399 / 1506 - 1893 epochs total
Iteration 0, loss = 0.0040
Iteration 20, loss = 0.0032
Iteration 40, loss = 0.0027
Iteration 60, loss = 0.0023
Iteration 80, loss = 0.0020
--- Epoch 400 / 1506 - 1894 epochs total
Iteration 0, loss = 0.0025
Iteration 20, loss = 0.0125
Iteration 40, loss = 0.0338
Iteration 60, loss = 0.0040
Iteration 80, loss = 0.0096
--- Epoch 401 / 1506 - 1895 epochs total
Iteration 0, loss = 0.0087
Iteration 20, loss = 0.0036
Iteration 40, loss = 0.0030
Iteration 60, loss = 0.0030
Iteration 80, loss = 0.0026
--- Epoch 402 / 1506 - 1896 epochs total
Iteration 0, loss = 0.0035
Iteration 20, loss = 0.0029
Iteration 40, loss = 0.0038
Iteration 60, loss = 0.0043
Iteration 80, loss = 0.0048
--- Epoch 403 / 1506 - 1897 epochs total
Iteration 0, loss = 0.0024
Iteration 20, loss = 0.0032
Iteration 40, loss = 0.0064
Iteration 60, loss = 0.0075
Iteration 80, loss = 0.0045
--- Epoch 404 / 1506 - 1898 epochs total
Iteration 0, loss = 0.0023
Iteration 20, loss = 0.0041
Iteration 40, loss = 0.0024
Iteration 60, loss = 0.0028
Iteration 80, loss = 0.0065
--- Epoch 405 / 1506 - 1899 epochs total
Iteration 0, loss = 0.0074
Iteration 20, loss = 0.0026
Iteration 40, loss = 0.0018
Iteration 60, loss = 0.0030
Iteration 80, loss = 0.0031
--- Epoch 406 / 1506 - 1900 epochs total
Iteration 0, loss = 0.0019
Iteration 20, loss = 0.0021
Iteration 40, loss = 0.0021
Iteration 60, loss = 0.0028
Iteration 80, loss = 0.0023
--- Epoch 407 / 1506 - 1901 epochs total
Iteration 0, loss = 0.0082
Iteration 20, loss = 0.0071
Iteration 40, loss = 0.0065
Iteration 60, loss = 0.0040
Iteration 80, loss = 0.0080
--- Epoch 408 / 1506 - 1902 epochs total
Iteration 0, loss = 0.0069
Iteration 20, loss = 0.0036
Iteration 40, loss = 0.0041
Iteration 60, loss = 0.0028
Iteration 80, loss = 0.0040
--- Epoch 409 / 1506 - 1903 epochs total
Iteration 0, loss = 0.0060
Iteration 20, loss = 0.0048
Iteration 40, loss = 0.0044
Iteration 60, loss = 0.0035
Iteration 80, loss = 0.0079
--- Epoch 410 / 1506 - 1904 epochs total
Iteration 0, loss = 0.0030
Iteration 20, loss = 0.0060
Iteration 40, loss = 0.0057
Iteration 60, loss = 0.0045
Iteration 80, loss = 0.0044
--- Epoch 411 / 1506 - 1905 epochs total
Iteration 0, loss = 0.0029
Iteration 20, loss = 0.0044
Iteration 40, loss = 0.0023
Iteration 60, loss = 0.0109
Iteration 80, loss = 0.0027
--- Epoch 412 / 1506 - 1906 epochs total
Iteration 0, loss = 0.0062
Iteration 20, loss = 0.0017
Iteration 40, loss = 0.0061
Iteration 60, loss = 0.0038
Iteration 80, loss = 0.0148
--- Epoch 413 / 1506 - 1907 epochs total
Iteration 0, loss = 0.0035
Iteration 20, loss = 0.0022
Iteration 40, loss = 0.0022
Iteration 60, loss = 0.0049
Iteration 80, loss = 0.0059
--- Epoch 414 / 1506 - 1908 epochs total
Iteration 0, loss = 0.0030
Iteration 20, loss = 0.0036
Iteration 40, loss = 0.0083
Iteration 60, loss = 0.0143
Iteration 80, loss = 0.0011
--- Epoch 415 / 1506 - 1909 epochs total
Iteration 0, loss = 0.0052
Iteration 20, loss = 0.0072
Iteration 40, loss = 0.0027
Iteration 60, loss = 0.0123
Iteration 80, loss = 0.0021
--- Epoch 416 / 1506 - 1910 epochs total
Iteration 0, loss = 0.0178
Iteration 20, loss = 0.0038
Iteration 40, loss = 0.0035
Iteration 60, loss = 0.0024
Iteration 80, loss = 0.0030
--- Epoch 417 / 1506 - 1911 epochs total
Iteration 0, loss = 0.0029
Iteration 20, loss = 0.0015
Iteration 40, loss = 0.0052
Iteration 60, loss = 0.0052
Iteration 80, loss = 0.0039
--- Epoch 418 / 1506 - 1912 epochs total
Iteration 0, loss = 0.0036
Iteration 20, loss = 0.0035
Iteration 40, loss = 0.0036
Iteration 60, loss = 0.0025
Iteration 80, loss = 0.0044
--- Epoch 419 / 1506 - 1913 epochs total
Iteration 0, loss = 0.0086
Iteration 20, loss = 0.0014
Iteration 40, loss = 0.0062
Iteration 60, loss = 0.0050
Iteration 80, loss = 0.0100
--- Epoch 420 / 1506 - 1914 epochs total
Iteration 0, loss = 0.0014
Iteration 20, loss = 0.0032
Iteration 40, loss = 0.0016
Iteration 60, loss = 0.0030
Iteration 80, loss = 0.0092
--- Epoch 421 / 1506 - 1915 epochs total
Iteration 0, loss = 0.0036
Iteration 20, loss = 0.0031
Iteration 40, loss = 0.0065
Iteration 60, loss = 0.0019
Iteration 80, loss = 0.0032
--- Epoch 422 / 1506 - 1916 epochs total
Iteration 0, loss = 0.0013
Iteration 20, loss = 0.0055
Iteration 40, loss = 0.0017
Iteration 60, loss = 0.0079
Iteration 80, loss = 0.0023
--- Epoch 423 / 1506 - 1917 epochs total
Iteration 0, loss = 0.0040
Iteration 20, loss = 0.0042
Iteration 40, loss = 0.0042
Iteration 60, loss = 0.0049
Iteration 80, loss = 0.0020
--- Epoch 424 / 1506 - 1918 epochs total
Iteration 0, loss = 0.0040
Iteration 20, loss = 0.0033
Iteration 40, loss = 0.0030
Iteration 60, loss = 0.0029
Iteration 80, loss = 0.0019
--- Epoch 425 / 1506 - 1919 epochs total
Iteration 0, loss = 0.0040
Iteration 20, loss = 0.0064
Iteration 40, loss = 0.0037
Iteration 60, loss = 0.0012
Iteration 80, loss = 0.0043
--- Epoch 426 / 1506 - 1920 epochs total
Iteration 0, loss = 0.0035
Iteration 20, loss = 0.0080
Iteration 40, loss = 0.0030
Iteration 60, loss = 0.0080
Iteration 80, loss = 0.0032
--- Epoch 427 / 1506 - 1921 epochs total
Iteration 0, loss = 0.0030
Iteration 20, loss = 0.0069
Iteration 40, loss = 0.0026
Iteration 60, loss = 0.0067
Iteration 80, loss = 0.0055
--- Epoch 428 / 1506 - 1922 epochs total
Iteration 0, loss = 0.0037
Iteration 20, loss = 0.0068
Iteration 40, loss = 0.0035
Iteration 60, loss = 0.0021
Iteration 80, loss = 0.0040
--- Epoch 429 / 1506 - 1923 epochs total
Iteration 0, loss = 0.0120
Iteration 20, loss = 0.0049
Iteration 40, loss = 0.0042
Iteration 60, loss = 0.0031
Iteration 80, loss = 0.0035
--- Epoch 430 / 1506 - 1924 epochs total
Iteration 0, loss = 0.0058
Iteration 20, loss = 0.0025
Iteration 40, loss = 0.0033
Iteration 60, loss = 0.0055
Iteration 80, loss = 0.0034
--- Epoch 431 / 1506 - 1925 epochs total
Iteration 0, loss = 0.0014
Iteration 20, loss = 0.0040
Iteration 40, loss = 0.0034
Iteration 60, loss = 0.0058
Iteration 80, loss = 0.0030
--- Epoch 432 / 1506 - 1926 epochs total
Iteration 0, loss = 0.0047
Iteration 20, loss = 0.0029
Iteration 40, loss = 0.0027
Iteration 60, loss = 0.0025
Iteration 80, loss = 0.0028
--- Epoch 433 / 1506 - 1927 epochs total
Iteration 0, loss = 0.0043
Iteration 20, loss = 0.0016
Iteration 40, loss = 0.0029
Iteration 60, loss = 0.0031
Iteration 80, loss = 0.0030
--- Epoch 434 / 1506 - 1928 epochs total
Iteration 0, loss = 0.0044
Iteration 20, loss = 0.0061
Iteration 40, loss = 0.0033
Iteration 60, loss = 0.0030
Iteration 80, loss = 0.0038
--- Epoch 435 / 1506 - 1929 epochs total
Iteration 0, loss = 0.0036
Iteration 20, loss = 0.0048
Iteration 40, loss = 0.0047
Iteration 60, loss = 0.0036
Iteration 80, loss = 0.0031
--- Epoch 436 / 1506 - 1930 epochs total
Iteration 0, loss = 0.0050
Iteration 20, loss = 0.0034
Iteration 40, loss = 0.0059
Iteration 60, loss = 0.0046
Iteration 80, loss = 0.0026
--- Epoch 437 / 1506 - 1931 epochs total
Iteration 0, loss = 0.0018
Iteration 20, loss = 0.0038
Iteration 40, loss = 0.0019
Iteration 60, loss = 0.0060
Iteration 80, loss = 0.0064
--- Epoch 438 / 1506 - 1932 epochs total
Iteration 0, loss = 0.0020
Iteration 20, loss = 0.0022
Iteration 40, loss = 0.0032
Iteration 60, loss = 0.0074
Iteration 80, loss = 0.0034
--- Epoch 439 / 1506 - 1933 epochs total
Iteration 0, loss = 0.0022
Iteration 20, loss = 0.0045
Iteration 40, loss = 0.0044
Iteration 60, loss = 0.0018
Iteration 80, loss = 0.0027
--- Epoch 440 / 1506 - 1934 epochs total
Iteration 0, loss = 0.0044
Iteration 20, loss = 0.0019
Iteration 40, loss = 0.0032
Iteration 60, loss = 0.0089
Iteration 80, loss = 0.0028
--- Epoch 441 / 1506 - 1935 epochs total
Iteration 0, loss = 0.0032
Iteration 20, loss = 0.0020
Iteration 40, loss = 0.0017
Iteration 60, loss = 0.0035
Iteration 80, loss = 0.0052
--- Epoch 442 / 1506 - 1936 epochs total
Iteration 0, loss = 0.0047
Iteration 20, loss = 0.0014
Iteration 40, loss = 0.0029
Iteration 60, loss = 0.0030
Iteration 80, loss = 0.0032
--- Epoch 443 / 1506 - 1937 epochs total
Iteration 0, loss = 0.0075
Iteration 20, loss = 0.0027
Iteration 40, loss = 0.0027
Iteration 60, loss = 0.0036
Iteration 80, loss = 0.0040
--- Epoch 444 / 1506 - 1938 epochs total
Iteration 0, loss = 0.0022
Iteration 20, loss = 0.0040
Iteration 40, loss = 0.0023
Iteration 60, loss = 0.0040
Iteration 80, loss = 0.0059
--- Epoch 445 / 1506 - 1939 epochs total
Iteration 0, loss = 0.0054
Iteration 20, loss = 0.0153
Iteration 40, loss = 0.0060
Iteration 60, loss = 0.0180
Iteration 80, loss = 0.0030
--- Epoch 446 / 1506 - 1940 epochs total
Iteration 0, loss = 0.0103
Iteration 20, loss = 0.0052
Iteration 40, loss = 0.0024
Iteration 60, loss = 0.0029
Iteration 80, loss = 0.0061
--- Epoch 447 / 1506 - 1941 epochs total
Iteration 0, loss = 0.0096
Iteration 20, loss = 0.0046
Iteration 40, loss = 0.0027
Iteration 60, loss = 0.0050
Iteration 80, loss = 0.0037
--- Epoch 448 / 1506 - 1942 epochs total
Iteration 0, loss = 0.0018
Iteration 20, loss = 0.0048
Iteration 40, loss = 0.0048
Iteration 60, loss = 0.0030
Iteration 80, loss = 0.0064
--- Epoch 449 / 1506 - 1943 epochs total
Iteration 0, loss = 0.0030
Iteration 20, loss = 0.0041
Iteration 40, loss = 0.0138
Iteration 60, loss = 0.0039
Iteration 80, loss = 0.0103
--- Epoch 450 / 1506 - 1944 epochs total
Iteration 0, loss = 0.0027
Iteration 20, loss = 0.0034
Iteration 40, loss = 0.0137
Iteration 60, loss = 0.0025
Iteration 80, loss = 0.0067
--- Epoch 451 / 1506 - 1945 epochs total
Iteration 0, loss = 0.0031
Iteration 20, loss = 0.0048
Iteration 40, loss = 0.0074
Iteration 60, loss = 0.0038
Iteration 80, loss = 0.0059
--- Epoch 452 / 1506 - 1946 epochs total
Iteration 0, loss = 0.0105
Iteration 20, loss = 0.0018
Iteration 40, loss = 0.0046
Iteration 60, loss = 0.0032
Iteration 80, loss = 0.0027
--- Epoch 453 / 1506 - 1947 epochs total
Iteration 0, loss = 0.0029
Iteration 20, loss = 0.0031
Iteration 40, loss = 0.0077
Iteration 60, loss = 0.0020
Iteration 80, loss = 0.0281
--- Epoch 454 / 1506 - 1948 epochs total
Iteration 0, loss = 0.0036
Iteration 20, loss = 0.0027
Iteration 40, loss = 0.0054
Iteration 60, loss = 0.0037
Iteration 80, loss = 0.0043
--- Epoch 455 / 1506 - 1949 epochs total
Iteration 0, loss = 0.0020
Iteration 20, loss = 0.0129
Iteration 40, loss = 0.0029
Iteration 60, loss = 0.0095
Iteration 80, loss = 0.0022
--- Epoch 456 / 1506 - 1950 epochs total
Iteration 0, loss = 0.0068
Iteration 20, loss = 0.0097
Iteration 40, loss = 0.0046
Iteration 60, loss = 0.0029
Iteration 80, loss = 0.0020
--- Epoch 457 / 1506 - 1951 epochs total
Iteration 0, loss = 0.0031
Iteration 20, loss = 0.0060
Iteration 40, loss = 0.0028
Iteration 60, loss = 0.0064
Iteration 80, loss = 0.0031
--- Epoch 458 / 1506 - 1952 epochs total
Iteration 0, loss = 0.0035
Iteration 20, loss = 0.0089
Iteration 40, loss = 0.0022
Iteration 60, loss = 0.0043
Iteration 80, loss = 0.0021
--- Epoch 459 / 1506 - 1953 epochs total
Iteration 0, loss = 0.0013
Iteration 20, loss = 0.0019
Iteration 40, loss = 0.0031
Iteration 60, loss = 0.0131
Iteration 80, loss = 0.0066
--- Epoch 460 / 1506 - 1954 epochs total
Iteration 0, loss = 0.0020
Iteration 20, loss = 0.0126
Iteration 40, loss = 0.0061
Iteration 60, loss = 0.0030
Iteration 80, loss = 0.0045
--- Epoch 461 / 1506 - 1955 epochs total
Iteration 0, loss = 0.0022
Iteration 20, loss = 0.0027
Iteration 40, loss = 0.0021
Iteration 60, loss = 0.0048
Iteration 80, loss = 0.0026
--- Epoch 462 / 1506 - 1956 epochs total
Iteration 0, loss = 0.0023
Iteration 20, loss = 0.0091
Iteration 40, loss = 0.0036
Iteration 60, loss = 0.0029
Iteration 80, loss = 0.0032
--- Epoch 463 / 1506 - 1957 epochs total
Iteration 0, loss = 0.0037
Iteration 20, loss = 0.0038
Iteration 40, loss = 0.0039
Iteration 60, loss = 0.0035
Iteration 80, loss = 0.0059
--- Epoch 464 / 1506 - 1958 epochs total
Iteration 0, loss = 0.0030
Iteration 20, loss = 0.0029
Iteration 40, loss = 0.0022
Iteration 60, loss = 0.0064
Iteration 80, loss = 0.0041
--- Epoch 465 / 1506 - 1959 epochs total
Iteration 0, loss = 0.0038
Iteration 20, loss = 0.0095
Iteration 40, loss = 0.0072
Iteration 60, loss = 0.0070
Iteration 80, loss = 0.0042
--- Epoch 466 / 1506 - 1960 epochs total
Iteration 0, loss = 0.0035
Iteration 20, loss = 0.0056
Iteration 40, loss = 0.0021
Iteration 60, loss = 0.0031
Iteration 80, loss = 0.0193
--- Epoch 467 / 1506 - 1961 epochs total
Iteration 0, loss = 0.0022
Iteration 20, loss = 0.0041
Iteration 40, loss = 0.0085
Iteration 60, loss = 0.0034
Iteration 80, loss = 0.0043
--- Epoch 468 / 1506 - 1962 epochs total
Iteration 0, loss = 0.0020
Iteration 20, loss = 0.0023
Iteration 40, loss = 0.0064
Iteration 60, loss = 0.0061
Iteration 80, loss = 0.0033
--- Epoch 469 / 1506 - 1963 epochs total
Iteration 0, loss = 0.0009
Iteration 20, loss = 0.0048
Iteration 40, loss = 0.0025
Iteration 60, loss = 0.0018
Iteration 80, loss = 0.0051
--- Epoch 470 / 1506 - 1964 epochs total
Iteration 0, loss = 0.0045
Iteration 20, loss = 0.0043
Iteration 40, loss = 0.0023
Iteration 60, loss = 0.0047
Iteration 80, loss = 0.0057
--- Epoch 471 / 1506 - 1965 epochs total
Iteration 0, loss = 0.0047
Iteration 20, loss = 0.0037
Iteration 40, loss = 0.0104
Iteration 60, loss = 0.0023
Iteration 80, loss = 0.0024
--- Epoch 472 / 1506 - 1966 epochs total
Iteration 0, loss = 0.0018
Iteration 20, loss = 0.0052
Iteration 40, loss = 0.0020
Iteration 60, loss = 0.0052
Iteration 80, loss = 0.0111
--- Epoch 473 / 1506 - 1967 epochs total
Iteration 0, loss = 0.0042
Iteration 20, loss = 0.0040
Iteration 40, loss = 0.0042
Iteration 60, loss = 0.0076
Iteration 80, loss = 0.0072
--- Epoch 474 / 1506 - 1968 epochs total
Iteration 0, loss = 0.0032
Iteration 20, loss = 0.0027
Iteration 40, loss = 0.0054
Iteration 60, loss = 0.0044
Iteration 80, loss = 0.0017
--- Epoch 475 / 1506 - 1969 epochs total
Iteration 0, loss = 0.0033
Iteration 20, loss = 0.0047
Iteration 40, loss = 0.0042
Iteration 60, loss = 0.0042
Iteration 80, loss = 0.0045
--- Epoch 476 / 1506 - 1970 epochs total
Iteration 0, loss = 0.0059
Iteration 20, loss = 0.0021
Iteration 40, loss = 0.0020
Iteration 60, loss = 0.0025
Iteration 80, loss = 0.0018
--- Epoch 477 / 1506 - 1971 epochs total
Iteration 0, loss = 0.0067
Iteration 20, loss = 0.0054
Iteration 40, loss = 0.0082
Iteration 60, loss = 0.0028
Iteration 80, loss = 0.0034
--- Epoch 478 / 1506 - 1972 epochs total
Iteration 0, loss = 0.0032
Iteration 20, loss = 0.0023
Iteration 40, loss = 0.0038
Iteration 60, loss = 0.0051
Iteration 80, loss = 0.0082
--- Epoch 479 / 1506 - 1973 epochs total
Iteration 0, loss = 0.0077
Iteration 20, loss = 0.0084
Iteration 40, loss = 0.0036
Iteration 60, loss = 0.0025
Iteration 80, loss = 0.0024
--- Epoch 480 / 1506 - 1974 epochs total
Iteration 0, loss = 0.0025
Iteration 20, loss = 0.0020
Iteration 40, loss = 0.0037
Iteration 60, loss = 0.0068
Iteration 80, loss = 0.0025
--- Epoch 481 / 1506 - 1975 epochs total
Iteration 0, loss = 0.0039
Iteration 20, loss = 0.0047
Iteration 40, loss = 0.0023
Iteration 60, loss = 0.0078
Iteration 80, loss = 0.0038
--- Epoch 482 / 1506 - 1976 epochs total
Iteration 0, loss = 0.0043
Iteration 20, loss = 0.0044
Iteration 40, loss = 0.0026
Iteration 60, loss = 0.0070
Iteration 80, loss = 0.0027
--- Epoch 483 / 1506 - 1977 epochs total
Iteration 0, loss = 0.0023
Iteration 20, loss = 0.0022
Iteration 40, loss = 0.0026
Iteration 60, loss = 0.0026
Iteration 80, loss = 0.0028
--- Epoch 484 / 1506 - 1978 epochs total
Iteration 0, loss = 0.0058
Iteration 20, loss = 0.0050
Iteration 40, loss = 0.0035
Iteration 60, loss = 0.0033
Iteration 80, loss = 0.0027
--- Epoch 485 / 1506 - 1979 epochs total
Iteration 0, loss = 0.0037
Iteration 20, loss = 0.0050
Iteration 40, loss = 0.0030
Iteration 60, loss = 0.0026
Iteration 80, loss = 0.0092
--- Epoch 486 / 1506 - 1980 epochs total
Iteration 0, loss = 0.0034
Iteration 20, loss = 0.0019
Iteration 40, loss = 0.0043
Iteration 60, loss = 0.0033
Iteration 80, loss = 0.0027
--- Epoch 487 / 1506 - 1981 epochs total
Iteration 0, loss = 0.0056
Iteration 20, loss = 0.0038
Iteration 40, loss = 0.0027
Iteration 60, loss = 0.0062
Iteration 80, loss = 0.0029
--- Epoch 488 / 1506 - 1982 epochs total
Iteration 0, loss = 0.0024
Iteration 20, loss = 0.0058
Iteration 40, loss = 0.0041
Iteration 60, loss = 0.0025
Iteration 80, loss = 0.0031
--- Epoch 489 / 1506 - 1983 epochs total
Iteration 0, loss = 0.0029
Iteration 20, loss = 0.0033
Iteration 40, loss = 0.0018
Iteration 60, loss = 0.0019
Iteration 80, loss = 0.0018
--- Epoch 490 / 1506 - 1984 epochs total
Iteration 0, loss = 0.0043
Iteration 20, loss = 0.0041
Iteration 40, loss = 0.0064
Iteration 60, loss = 0.0023
Iteration 80, loss = 0.0067
--- Epoch 491 / 1506 - 1985 epochs total
Iteration 0, loss = 0.0048
Iteration 20, loss = 0.0172
Iteration 40, loss = 0.0064
Iteration 60, loss = 0.0040
Iteration 80, loss = 0.0038
--- Epoch 492 / 1506 - 1986 epochs total
Iteration 0, loss = 0.0032
Iteration 20, loss = 0.0028
Iteration 40, loss = 0.0027
Iteration 60, loss = 0.0021
Iteration 80, loss = 0.0040
--- Epoch 493 / 1506 - 1987 epochs total
Iteration 0, loss = 0.0059
Iteration 20, loss = 0.0032
Iteration 40, loss = 0.0045
Iteration 60, loss = 0.0040
Iteration 80, loss = 0.0041
--- Epoch 494 / 1506 - 1988 epochs total
Iteration 0, loss = 0.0016
Iteration 20, loss = 0.0055
Iteration 40, loss = 0.0097
Iteration 60, loss = 0.0070
Iteration 80, loss = 0.0014
--- Epoch 495 / 1506 - 1989 epochs total
Iteration 0, loss = 0.0033
Iteration 20, loss = 0.0020
Iteration 40, loss = 0.0025
Iteration 60, loss = 0.0029
Iteration 80, loss = 0.0014
--- Epoch 496 / 1506 - 1990 epochs total
Iteration 0, loss = 0.0039
Iteration 20, loss = 0.0019
Iteration 40, loss = 0.0138
Iteration 60, loss = 0.0039
Iteration 80, loss = 0.0063
--- Epoch 497 / 1506 - 1991 epochs total
Iteration 0, loss = 0.0040
Iteration 20, loss = 0.0029
Iteration 40, loss = 0.0036
Iteration 60, loss = 0.0042
Iteration 80, loss = 0.0060
--- Epoch 498 / 1506 - 1992 epochs total
Iteration 0, loss = 0.0071
Iteration 20, loss = 0.0023
Iteration 40, loss = 0.0030
Iteration 60, loss = 0.0032
Iteration 80, loss = 0.0076
--- Epoch 499 / 1506 - 1993 epochs total
Iteration 0, loss = 0.0044
Iteration 20, loss = 0.0030
Iteration 40, loss = 0.0022
Iteration 60, loss = 0.0043
Iteration 80, loss = 0.0033
--- Epoch 500 / 1506 - 1994 epochs total
Iteration 0, loss = 0.0017
Iteration 20, loss = 0.0051
Iteration 40, loss = 0.0036
Iteration 60, loss = 0.0111
Iteration 80, loss = 0.0062
--- Epoch 501 / 1506 - 1995 epochs total
Iteration 0, loss = 0.0035
Iteration 20, loss = 0.0187
Iteration 40, loss = 0.0041
Iteration 60, loss = 0.0029
Iteration 80, loss = 0.0036
--- Epoch 502 / 1506 - 1996 epochs total
Iteration 0, loss = 0.0080
Iteration 20, loss = 0.0117
Iteration 40, loss = 0.0016
Iteration 60, loss = 0.0032
Iteration 80, loss = 0.0045
--- Epoch 503 / 1506 - 1997 epochs total
Iteration 0, loss = 0.0039
Iteration 20, loss = 0.0054
Iteration 40, loss = 0.0065
Iteration 60, loss = 0.0046
Iteration 80, loss = 0.0068
--- Epoch 504 / 1506 - 1998 epochs total
Iteration 0, loss = 0.0076
Iteration 20, loss = 0.0060
Iteration 40, loss = 0.0015
Iteration 60, loss = 0.0048
Iteration 80, loss = 0.0033
--- Epoch 505 / 1506 - 1999 epochs total
Iteration 0, loss = 0.0059
Iteration 20, loss = 0.0053
Iteration 40, loss = 0.0038
Iteration 60, loss = 0.0027
Iteration 80, loss = 0.0035
--- Epoch 506 / 1506 - 2000 epochs total
Iteration 0, loss = 0.0028
Iteration 20, loss = 0.0028
Iteration 40, loss = 0.0032
Iteration 60, loss = 0.0069
Iteration 80, loss = 0.0027
--- Epoch 507 / 1506 - 2001 epochs total
Iteration 0, loss = 0.0028
Iteration 20, loss = 0.0051
Iteration 40, loss = 0.0055
Iteration 60, loss = 0.0037
Iteration 80, loss = 0.0023
--- Epoch 508 / 1506 - 2002 epochs total
Iteration 0, loss = 0.0100
Iteration 20, loss = 0.0021
Iteration 40, loss = 0.0016
Iteration 60, loss = 0.0032
Iteration 80, loss = 0.0048
--- Epoch 509 / 1506 - 2003 epochs total
Iteration 0, loss = 0.0030
Iteration 20, loss = 0.0202
Iteration 40, loss = 0.0024
Iteration 60, loss = 0.0060
Iteration 80, loss = 0.0068
--- Epoch 510 / 1506 - 2004 epochs total
Iteration 0, loss = 0.0042
Iteration 20, loss = 0.0077
Iteration 40, loss = 0.0038
Iteration 60, loss = 0.0037
Iteration 80, loss = 0.0032
--- Epoch 511 / 1506 - 2005 epochs total
Iteration 0, loss = 0.0043
Iteration 20, loss = 0.0073
Iteration 40, loss = 0.0079
Iteration 60, loss = 0.0046
Iteration 80, loss = 0.0036
--- Epoch 512 / 1506 - 2006 epochs total
Iteration 0, loss = 0.0070
Iteration 20, loss = 0.0043
Iteration 40, loss = 0.0059
Iteration 60, loss = 0.0036
Iteration 80, loss = 0.0035
--- Epoch 513 / 1506 - 2007 epochs total
Iteration 0, loss = 0.0022
Iteration 20, loss = 0.0030
Iteration 40, loss = 0.0134
Iteration 60, loss = 0.0041
Iteration 80, loss = 0.0020
--- Epoch 514 / 1506 - 2008 epochs total
Iteration 0, loss = 0.0052
Iteration 20, loss = 0.0056
Iteration 40, loss = 0.0062
Iteration 60, loss = 0.0032
Iteration 80, loss = 0.0042
--- Epoch 515 / 1506 - 2009 epochs total
Iteration 0, loss = 0.0028
Iteration 20, loss = 0.0048
Iteration 40, loss = 0.0019
Iteration 60, loss = 0.0026
Iteration 80, loss = 0.0033
--- Epoch 516 / 1506 - 2010 epochs total
Iteration 0, loss = 0.0026
Iteration 20, loss = 0.0031
Iteration 40, loss = 0.0037
Iteration 60, loss = 0.0028
Iteration 80, loss = 0.0030
--- Epoch 517 / 1506 - 2011 epochs total
Iteration 0, loss = 0.0026
Iteration 20, loss = 0.0050
Iteration 40, loss = 0.0021
Iteration 60, loss = 0.0063
Iteration 80, loss = 0.0023
--- Epoch 518 / 1506 - 2012 epochs total
Iteration 0, loss = 0.0022
Iteration 20, loss = 0.0034
Iteration 40, loss = 0.0025
Iteration 60, loss = 0.0112
Iteration 80, loss = 0.0030
--- Epoch 519 / 1506 - 2013 epochs total
Iteration 0, loss = 0.0184
Iteration 20, loss = 0.0127
Iteration 40, loss = 0.0050
Iteration 60, loss = 0.0017
Iteration 80, loss = 0.0070
--- Epoch 520 / 1506 - 2014 epochs total
Iteration 0, loss = 0.0048
Iteration 20, loss = 0.0018
Iteration 40, loss = 0.0047
Iteration 60, loss = 0.0039
Iteration 80, loss = 0.0031
--- Epoch 521 / 1506 - 2015 epochs total
Iteration 0, loss = 0.0718
Iteration 20, loss = 0.0169
Iteration 40, loss = 0.0020
Iteration 60, loss = 0.0069
Iteration 80, loss = 0.0033
--- Epoch 522 / 1506 - 2016 epochs total
Iteration 0, loss = 0.0060
Iteration 20, loss = 0.0020
Iteration 40, loss = 0.0082
Iteration 60, loss = 0.0050
Iteration 80, loss = 0.0021
--- Epoch 523 / 1506 - 2017 epochs total
Iteration 0, loss = 0.0018
Iteration 20, loss = 0.0020
Iteration 40, loss = 0.0041
Iteration 60, loss = 0.0032
Iteration 80, loss = 0.0102
--- Epoch 524 / 1506 - 2018 epochs total
Iteration 0, loss = 0.0040
Iteration 20, loss = 0.0011
Iteration 40, loss = 0.0057
Iteration 60, loss = 0.0104
Iteration 80, loss = 0.0031
--- Epoch 525 / 1506 - 2019 epochs total
Iteration 0, loss = 0.0045
Iteration 20, loss = 0.0059
Iteration 40, loss = 0.0029
Iteration 60, loss = 0.0046
Iteration 80, loss = 0.0097
--- Epoch 526 / 1506 - 2020 epochs total
Iteration 0, loss = 0.0029
Iteration 20, loss = 0.0046
Iteration 40, loss = 0.0044
Iteration 60, loss = 0.0051
Iteration 80, loss = 0.0050
--- Epoch 527 / 1506 - 2021 epochs total
Iteration 0, loss = 0.0032
Iteration 20, loss = 0.0035
Iteration 40, loss = 0.0040
Iteration 60, loss = 0.0046
Iteration 80, loss = 0.0020
--- Epoch 528 / 1506 - 2022 epochs total
Iteration 0, loss = 0.0046
Iteration 20, loss = 0.0045
Iteration 40, loss = 0.0018
Iteration 60, loss = 0.0061
Iteration 80, loss = 0.0153
--- Epoch 529 / 1506 - 2023 epochs total
Iteration 0, loss = 0.0031
Iteration 20, loss = 0.0031
Iteration 40, loss = 0.0189
Iteration 60, loss = 0.0023
Iteration 80, loss = 0.0035
--- Epoch 530 / 1506 - 2024 epochs total
Iteration 0, loss = 0.0069
Iteration 20, loss = 0.0033
Iteration 40, loss = 0.0031
Iteration 60, loss = 0.0122
Iteration 80, loss = 0.0040
--- Epoch 531 / 1506 - 2025 epochs total
Iteration 0, loss = 0.0047
Iteration 20, loss = 0.0023
Iteration 40, loss = 0.0021
Iteration 60, loss = 0.0063
Iteration 80, loss = 0.0041
--- Epoch 532 / 1506 - 2026 epochs total
Iteration 0, loss = 0.0042
Iteration 20, loss = 0.0024
Iteration 40, loss = 0.0028
Iteration 60, loss = 0.0059
Iteration 80, loss = 0.0038
--- Epoch 533 / 1506 - 2027 epochs total
Iteration 0, loss = 0.0022
Iteration 20, loss = 0.0054
Iteration 40, loss = 0.0032
Iteration 60, loss = 0.0046
Iteration 80, loss = 0.0041
--- Epoch 534 / 1506 - 2028 epochs total
Iteration 0, loss = 0.0042
Iteration 20, loss = 0.0035
Iteration 40, loss = 0.0073
Iteration 60, loss = 0.0023
Iteration 80, loss = 0.0041
--- Epoch 535 / 1506 - 2029 epochs total
Iteration 0, loss = 0.0018
Iteration 20, loss = 0.0029
Iteration 40, loss = 0.0025
Iteration 60, loss = 0.0082
Iteration 80, loss = 0.0061
--- Epoch 536 / 1506 - 2030 epochs total
Iteration 0, loss = 0.0017
Iteration 20, loss = 0.0063
Iteration 40, loss = 0.0034
Iteration 60, loss = 0.0024
Iteration 80, loss = 0.0026
--- Epoch 537 / 1506 - 2031 epochs total
Iteration 0, loss = 0.0136
Iteration 20, loss = 0.0059
Iteration 40, loss = 0.0051
Iteration 60, loss = 0.0034
Iteration 80, loss = 0.0043
--- Epoch 538 / 1506 - 2032 epochs total
Iteration 0, loss = 0.0072
Iteration 20, loss = 0.0097
Iteration 40, loss = 0.0130
Iteration 60, loss = 0.0046
Iteration 80, loss = 0.0050
--- Epoch 539 / 1506 - 2033 epochs total
Iteration 0, loss = 0.0047
Iteration 20, loss = 0.0026
Iteration 40, loss = 0.0037
Iteration 60, loss = 0.0032
Iteration 80, loss = 0.0032
--- Epoch 540 / 1506 - 2034 epochs total
Iteration 0, loss = 0.0087
Iteration 20, loss = 0.0044
Iteration 40, loss = 0.0030
Iteration 60, loss = 0.0036
Iteration 80, loss = 0.0036
--- Epoch 541 / 1506 - 2035 epochs total
Iteration 0, loss = 0.0041
Iteration 20, loss = 0.0036
Iteration 40, loss = 0.0026
Iteration 60, loss = 0.0029
Iteration 80, loss = 0.0035
--- Epoch 542 / 1506 - 2036 epochs total
Iteration 0, loss = 0.0029
Iteration 20, loss = 0.0017
Iteration 40, loss = 0.0106
Iteration 60, loss = 0.0052
Iteration 80, loss = 0.0034
--- Epoch 543 / 1506 - 2037 epochs total
Iteration 0, loss = 0.0035
Iteration 20, loss = 0.0036
Iteration 40, loss = 0.0024
Iteration 60, loss = 0.0023
Iteration 80, loss = 0.0034
--- Epoch 544 / 1506 - 2038 epochs total
Iteration 0, loss = 0.0047
Iteration 20, loss = 0.0159
Iteration 40, loss = 0.0021
Iteration 60, loss = 0.0017
Iteration 80, loss = 0.0032
--- Epoch 545 / 1506 - 2039 epochs total
Iteration 0, loss = 0.0043
Iteration 20, loss = 0.0044
Iteration 40, loss = 0.0056
Iteration 60, loss = 0.0143
Iteration 80, loss = 0.0026
--- Epoch 546 / 1506 - 2040 epochs total
Iteration 0, loss = 0.0052
Iteration 20, loss = 0.0046
Iteration 40, loss = 0.0021
Iteration 60, loss = 0.0034
Iteration 80, loss = 0.0081
--- Epoch 547 / 1506 - 2041 epochs total
Iteration 0, loss = 0.0051
Iteration 20, loss = 0.0033
Iteration 40, loss = 0.0025
Iteration 60, loss = 0.0032
Iteration 80, loss = 0.0036
--- Epoch 548 / 1506 - 2042 epochs total
Iteration 0, loss = 0.0064
Iteration 20, loss = 0.0041
Iteration 40, loss = 0.0048
Iteration 60, loss = 0.0025
Iteration 80, loss = 0.0024
--- Epoch 549 / 1506 - 2043 epochs total
Iteration 0, loss = 0.0038
Iteration 20, loss = 0.0119
Iteration 40, loss = 0.0050
Iteration 60, loss = 0.0021
Iteration 80, loss = 0.0028
--- Epoch 550 / 1506 - 2044 epochs total
Iteration 0, loss = 0.0143
Iteration 20, loss = 0.0077
Iteration 40, loss = 0.0021
Iteration 60, loss = 0.0028
Iteration 80, loss = 0.0071
--- Epoch 551 / 1506 - 2045 epochs total
Iteration 0, loss = 0.0034
Iteration 20, loss = 0.0036
Iteration 40, loss = 0.0052
Iteration 60, loss = 0.0107
Iteration 80, loss = 0.0065
--- Epoch 552 / 1506 - 2046 epochs total
Iteration 0, loss = 0.0090
Iteration 20, loss = 0.0037
Iteration 40, loss = 0.0095
Iteration 60, loss = 0.0063
Iteration 80, loss = 0.0027
--- Epoch 553 / 1506 - 2047 epochs total
Iteration 0, loss = 0.0030
Iteration 20, loss = 0.0038
Iteration 40, loss = 0.0138
Iteration 60, loss = 0.0032
Iteration 80, loss = 0.0051
--- Epoch 554 / 1506 - 2048 epochs total
Iteration 0, loss = 0.0099
Iteration 20, loss = 0.0035
Iteration 40, loss = 0.0042
Iteration 60, loss = 0.0049
Iteration 80, loss = 0.0104
--- Epoch 555 / 1506 - 2049 epochs total
Iteration 0, loss = 0.0029
Iteration 20, loss = 0.0051
Iteration 40, loss = 0.0024
Iteration 60, loss = 0.0033
Iteration 80, loss = 0.0057
--- Epoch 556 / 1506 - 2050 epochs total
Iteration 0, loss = 0.0021
Iteration 20, loss = 0.0038
Iteration 40, loss = 0.0026
Iteration 60, loss = 0.0069
Iteration 80, loss = 0.0023
--- Epoch 557 / 1506 - 2051 epochs total
Iteration 0, loss = 0.0023
Iteration 20, loss = 0.0041
Iteration 40, loss = 0.0037
Iteration 60, loss = 0.0034
Iteration 80, loss = 0.0034
--- Epoch 558 / 1506 - 2052 epochs total
Iteration 0, loss = 0.0029
Iteration 20, loss = 0.0016
Iteration 40, loss = 0.0052
Iteration 60, loss = 0.0035
Iteration 80, loss = 0.0024
--- Epoch 559 / 1506 - 2053 epochs total
Iteration 0, loss = 0.0038
Iteration 20, loss = 0.0027
Iteration 40, loss = 0.0056
Iteration 60, loss = 0.0034
Iteration 80, loss = 0.0050
--- Epoch 560 / 1506 - 2054 epochs total
Iteration 0, loss = 0.0032
Iteration 20, loss = 0.0021
Iteration 40, loss = 0.0042
Iteration 60, loss = 0.0080
Iteration 80, loss = 0.0054
--- Epoch 561 / 1506 - 2055 epochs total
Iteration 0, loss = 0.0024
Iteration 20, loss = 0.0029
Iteration 40, loss = 0.0045
Iteration 60, loss = 0.0025
Iteration 80, loss = 0.0032
--- Epoch 562 / 1506 - 2056 epochs total
Iteration 0, loss = 0.0044
Iteration 20, loss = 0.0046
Iteration 40, loss = 0.0023
Iteration 60, loss = 0.0046
Iteration 80, loss = 0.0059
--- Epoch 563 / 1506 - 2057 epochs total
Iteration 0, loss = 0.0019
Iteration 20, loss = 0.0025
Iteration 40, loss = 0.0040
Iteration 60, loss = 0.0043
Iteration 80, loss = 0.0035
--- Epoch 564 / 1506 - 2058 epochs total
Iteration 0, loss = 0.0035
Iteration 20, loss = 0.0022
Iteration 40, loss = 0.0019
Iteration 60, loss = 0.0037
Iteration 80, loss = 0.0052
--- Epoch 565 / 1506 - 2059 epochs total
Iteration 0, loss = 0.0102
Iteration 20, loss = 0.0027
Iteration 40, loss = 0.0043
Iteration 60, loss = 0.0057
Iteration 80, loss = 0.0133
--- Epoch 566 / 1506 - 2060 epochs total
Iteration 0, loss = 0.0038
Iteration 20, loss = 0.0037
Iteration 40, loss = 0.0070
Iteration 60, loss = 0.0038
Iteration 80, loss = 0.0034
--- Epoch 567 / 1506 - 2061 epochs total
Iteration 0, loss = 0.0033
Iteration 20, loss = 0.0022
Iteration 40, loss = 0.0065
Iteration 60, loss = 0.0013
Iteration 80, loss = 0.0028
--- Epoch 568 / 1506 - 2062 epochs total
Iteration 0, loss = 0.0054
Iteration 20, loss = 0.0016
Iteration 40, loss = 0.0020
Iteration 60, loss = 0.0071
Iteration 80, loss = 0.0048
--- Epoch 569 / 1506 - 2063 epochs total
Iteration 0, loss = 0.0035
Iteration 20, loss = 0.0051
Iteration 40, loss = 0.0059
Iteration 60, loss = 0.0073
Iteration 80, loss = 0.0042
--- Epoch 570 / 1506 - 2064 epochs total
Iteration 0, loss = 0.0059
Iteration 20, loss = 0.0035
Iteration 40, loss = 0.0053
Iteration 60, loss = 0.0038
Iteration 80, loss = 0.0082
--- Epoch 571 / 1506 - 2065 epochs total
Iteration 0, loss = 0.0028
Iteration 20, loss = 0.0049
Iteration 40, loss = 0.0026
Iteration 60, loss = 0.0016
Iteration 80, loss = 0.0025
--- Epoch 572 / 1506 - 2066 epochs total
Iteration 0, loss = 0.0044
Iteration 20, loss = 0.0046
Iteration 40, loss = 0.0034
Iteration 60, loss = 0.0052
Iteration 80, loss = 0.0049
--- Epoch 573 / 1506 - 2067 epochs total
Iteration 0, loss = 0.0031
Iteration 20, loss = 0.0028
Iteration 40, loss = 0.0064
Iteration 60, loss = 0.0046
Iteration 80, loss = 0.0030
--- Epoch 574 / 1506 - 2068 epochs total
Iteration 0, loss = 0.0042
Iteration 20, loss = 0.0034
Iteration 40, loss = 0.0068
Iteration 60, loss = 0.0072
Iteration 80, loss = 0.0067
--- Epoch 575 / 1506 - 2069 epochs total
Iteration 0, loss = 0.0046
Iteration 20, loss = 0.0024
Iteration 40, loss = 0.0025
Iteration 60, loss = 0.0057
Iteration 80, loss = 0.0038
--- Epoch 576 / 1506 - 2070 epochs total
Iteration 0, loss = 0.0025
Iteration 20, loss = 0.0027
Iteration 40, loss = 0.0072
Iteration 60, loss = 0.0033
Iteration 80, loss = 0.0028
--- Epoch 577 / 1506 - 2071 epochs total
Iteration 0, loss = 0.0036
Iteration 20, loss = 0.0022
Iteration 40, loss = 0.0051
Iteration 60, loss = 0.0017
Iteration 80, loss = 0.0032
--- Epoch 578 / 1506 - 2072 epochs total
Iteration 0, loss = 0.0035
Iteration 20, loss = 0.0045
Iteration 40, loss = 0.0066
Iteration 60, loss = 0.0038
Iteration 80, loss = 0.0035
--- Epoch 579 / 1506 - 2073 epochs total
Iteration 0, loss = 0.0033
Iteration 20, loss = 0.0117
Iteration 40, loss = 0.0050
Iteration 60, loss = 0.0026
Iteration 80, loss = 0.0027
--- Epoch 580 / 1506 - 2074 epochs total
Iteration 0, loss = 0.0030
Iteration 20, loss = 0.0035
Iteration 40, loss = 0.0037
Iteration 60, loss = 0.0035
Iteration 80, loss = 0.0036
--- Epoch 581 / 1506 - 2075 epochs total
Iteration 0, loss = 0.0029
Iteration 20, loss = 0.0042
Iteration 40, loss = 0.0037
Iteration 60, loss = 0.0021
Iteration 80, loss = 0.0043
--- Epoch 582 / 1506 - 2076 epochs total
Iteration 0, loss = 0.0030
Iteration 20, loss = 0.0052
Iteration 40, loss = 0.0071
Iteration 60, loss = 0.0030
Iteration 80, loss = 0.0025
--- Epoch 583 / 1506 - 2077 epochs total
Iteration 0, loss = 0.0032
Iteration 20, loss = 0.0040
Iteration 40, loss = 0.0029
Iteration 60, loss = 0.0043
Iteration 80, loss = 0.0030
--- Epoch 584 / 1506 - 2078 epochs total
Iteration 0, loss = 0.0120
Iteration 20, loss = 0.0034
Iteration 40, loss = 0.0042
Iteration 60, loss = 0.0070
Iteration 80, loss = 0.0053
--- Epoch 585 / 1506 - 2079 epochs total
Iteration 0, loss = 0.0049
Iteration 20, loss = 0.0028
Iteration 40, loss = 0.0028
Iteration 60, loss = 0.0044
Iteration 80, loss = 0.0054
--- Epoch 586 / 1506 - 2080 epochs total
Iteration 0, loss = 0.0038
Iteration 20, loss = 0.0020
Iteration 40, loss = 0.0023
Iteration 60, loss = 0.0027
Iteration 80, loss = 0.0024
--- Epoch 587 / 1506 - 2081 epochs total
Iteration 0, loss = 0.0054
Iteration 20, loss = 0.0059
Iteration 40, loss = 0.0038
Iteration 60, loss = 0.0081
Iteration 80, loss = 0.0025
--- Epoch 588 / 1506 - 2082 epochs total
Iteration 0, loss = 0.0071
Iteration 20, loss = 0.0039
Iteration 40, loss = 0.0099
Iteration 60, loss = 0.0075
Iteration 80, loss = 0.0052
--- Epoch 589 / 1506 - 2083 epochs total
Iteration 0, loss = 0.0040
Iteration 20, loss = 0.0022
Iteration 40, loss = 0.0021
Iteration 60, loss = 0.0019
Iteration 80, loss = 0.0034
--- Epoch 590 / 1506 - 2084 epochs total
Iteration 0, loss = 0.0025
Iteration 20, loss = 0.0051
Iteration 40, loss = 0.0044
Iteration 60, loss = 0.0033
Iteration 80, loss = 0.0027
--- Epoch 591 / 1506 - 2085 epochs total
Iteration 0, loss = 0.0054
Iteration 20, loss = 0.0041
Iteration 40, loss = 0.0009
Iteration 60, loss = 0.0036
Iteration 80, loss = 0.0040
--- Epoch 592 / 1506 - 2086 epochs total
Iteration 0, loss = 0.0028
Iteration 20, loss = 0.0039
Iteration 40, loss = 0.0043
Iteration 60, loss = 0.0022
Iteration 80, loss = 0.0065
--- Epoch 593 / 1506 - 2087 epochs total
Iteration 0, loss = 0.0045
Iteration 20, loss = 0.0051
Iteration 40, loss = 0.0035
Iteration 60, loss = 0.0036
Iteration 80, loss = 0.0099
--- Epoch 594 / 1506 - 2088 epochs total
Iteration 0, loss = 0.0013
Iteration 20, loss = 0.0036
Iteration 40, loss = 0.0021
Iteration 60, loss = 0.0035
Iteration 80, loss = 0.0033
--- Epoch 595 / 1506 - 2089 epochs total
Iteration 0, loss = 0.0099
Iteration 20, loss = 0.0065
Iteration 40, loss = 0.0130
Iteration 60, loss = 0.0055
Iteration 80, loss = 0.0037
--- Epoch 596 / 1506 - 2090 epochs total
Iteration 0, loss = 0.0095
Iteration 20, loss = 0.0116
Iteration 40, loss = 0.0041
Iteration 60, loss = 0.0110
Iteration 80, loss = 0.0031
--- Epoch 597 / 1506 - 2091 epochs total
Iteration 0, loss = 0.0131
Iteration 20, loss = 0.0035
Iteration 40, loss = 0.0029
Iteration 60, loss = 0.0046
Iteration 80, loss = 0.0042
--- Epoch 598 / 1506 - 2092 epochs total
Iteration 0, loss = 0.0037
Iteration 20, loss = 0.0045
Iteration 40, loss = 0.0022
Iteration 60, loss = 0.0027
Iteration 80, loss = 0.0116
--- Epoch 599 / 1506 - 2093 epochs total
Iteration 0, loss = 0.0111
Iteration 20, loss = 0.0035
Iteration 40, loss = 0.0031
Iteration 60, loss = 0.0028
Iteration 80, loss = 0.0023
--- Epoch 600 / 1506 - 2094 epochs total
Iteration 0, loss = 0.0034
Iteration 20, loss = 0.0049
Iteration 40, loss = 0.0028
Iteration 60, loss = 0.0054
Iteration 80, loss = 0.0022
--- Epoch 601 / 1506 - 2095 epochs total
Iteration 0, loss = 0.0080
Iteration 20, loss = 0.0057
Iteration 40, loss = 0.0083
Iteration 60, loss = 0.0073
Iteration 80, loss = 0.0079
--- Epoch 602 / 1506 - 2096 epochs total
Iteration 0, loss = 0.0035
Iteration 20, loss = 0.0027
Iteration 40, loss = 0.0020
Iteration 60, loss = 0.0079
Iteration 80, loss = 0.0052
--- Epoch 603 / 1506 - 2097 epochs total
Iteration 0, loss = 0.0020
Iteration 20, loss = 0.0067
Iteration 40, loss = 0.0036
Iteration 60, loss = 0.0022
Iteration 80, loss = 0.0065
--- Epoch 604 / 1506 - 2098 epochs total
Iteration 0, loss = 0.0044
Iteration 20, loss = 0.0017
Iteration 40, loss = 0.0045
Iteration 60, loss = 0.0024
Iteration 80, loss = 0.0150
--- Epoch 605 / 1506 - 2099 epochs total
Iteration 0, loss = 0.0085
Iteration 20, loss = 0.0077
Iteration 40, loss = 0.0086
Iteration 60, loss = 0.0033
Iteration 80, loss = 0.0017
--- Epoch 606 / 1506 - 2100 epochs total
Iteration 0, loss = 0.0079
Iteration 20, loss = 0.0036
Iteration 40, loss = 0.0029
Iteration 60, loss = 0.0032
Iteration 80, loss = 0.0019
--- Epoch 607 / 1506 - 2101 epochs total
Iteration 0, loss = 0.0083
Iteration 20, loss = 0.0078
Iteration 40, loss = 0.0038
Iteration 60, loss = 0.0037
Iteration 80, loss = 0.0062
--- Epoch 608 / 1506 - 2102 epochs total
Iteration 0, loss = 0.0048
Iteration 20, loss = 0.0023
Iteration 40, loss = 0.0072
Iteration 60, loss = 0.0029
Iteration 80, loss = 0.0045
--- Epoch 609 / 1506 - 2103 epochs total
Iteration 0, loss = 0.0041
Iteration 20, loss = 0.0075
Iteration 40, loss = 0.0041
Iteration 60, loss = 0.0030
Iteration 80, loss = 0.0028
--- Epoch 610 / 1506 - 2104 epochs total
Iteration 0, loss = 0.0076
Iteration 20, loss = 0.0035
Iteration 40, loss = 0.0028
Iteration 60, loss = 0.0070
Iteration 80, loss = 0.0034
--- Epoch 611 / 1506 - 2105 epochs total
Iteration 0, loss = 0.0029
Iteration 20, loss = 0.0125
Iteration 40, loss = 0.0042
Iteration 60, loss = 0.0045
Iteration 80, loss = 0.0089
--- Epoch 612 / 1506 - 2106 epochs total
Iteration 0, loss = 0.0049
Iteration 20, loss = 0.0019
Iteration 40, loss = 0.0038
Iteration 60, loss = 0.0030
Iteration 80, loss = 0.0033
--- Epoch 613 / 1506 - 2107 epochs total
Iteration 0, loss = 0.0051
Iteration 20, loss = 0.0025
Iteration 40, loss = 0.0071
Iteration 60, loss = 0.0087
Iteration 80, loss = 0.0026
--- Epoch 614 / 1506 - 2108 epochs total
Iteration 0, loss = 0.0043
Iteration 20, loss = 0.0044
Iteration 40, loss = 0.0050
Iteration 60, loss = 0.0047
Iteration 80, loss = 0.0037
--- Epoch 615 / 1506 - 2109 epochs total
Iteration 0, loss = 0.0045
Iteration 20, loss = 0.0035
Iteration 40, loss = 0.0039
Iteration 60, loss = 0.0192
Iteration 80, loss = 0.0018
--- Epoch 616 / 1506 - 2110 epochs total
Iteration 0, loss = 0.0061
Iteration 20, loss = 0.0029
Iteration 40, loss = 0.0110
Iteration 60, loss = 0.0079
Iteration 80, loss = 0.0064
--- Epoch 617 / 1506 - 2111 epochs total
Iteration 0, loss = 0.0016
Iteration 20, loss = 0.0071
Iteration 40, loss = 0.0059
Iteration 60, loss = 0.0087
Iteration 80, loss = 0.0030
--- Epoch 618 / 1506 - 2112 epochs total
Iteration 0, loss = 0.0016
Iteration 20, loss = 0.0028
Iteration 40, loss = 0.0019
Iteration 60, loss = 0.0034
Iteration 80, loss = 0.0027
--- Epoch 619 / 1506 - 2113 epochs total
Iteration 0, loss = 0.0026
Iteration 20, loss = 0.0049
Iteration 40, loss = 0.0029
Iteration 60, loss = 0.0043
Iteration 80, loss = 0.0063
--- Epoch 620 / 1506 - 2114 epochs total
Iteration 0, loss = 0.0026
Iteration 20, loss = 0.0031
Iteration 40, loss = 0.0054
Iteration 60, loss = 0.0072
Iteration 80, loss = 0.0025
--- Epoch 621 / 1506 - 2115 epochs total
Iteration 0, loss = 0.0039
Iteration 20, loss = 0.0024
Iteration 40, loss = 0.0038
Iteration 60, loss = 0.0023
Iteration 80, loss = 0.0108
--- Epoch 622 / 1506 - 2116 epochs total
Iteration 0, loss = 0.0047
Iteration 20, loss = 0.0048
Iteration 40, loss = 0.0019
Iteration 60, loss = 0.0030
Iteration 80, loss = 0.0052
--- Epoch 623 / 1506 - 2117 epochs total
Iteration 0, loss = 0.0061
Iteration 20, loss = 0.0076
Iteration 40, loss = 0.0051
Iteration 60, loss = 0.0042
Iteration 80, loss = 0.0049
--- Epoch 624 / 1506 - 2118 epochs total
Iteration 0, loss = 0.0061
Iteration 20, loss = 0.0026
Iteration 40, loss = 0.0027
Iteration 60, loss = 0.0015
Iteration 80, loss = 0.0055
--- Epoch 625 / 1506 - 2119 epochs total
Iteration 0, loss = 0.0122
Iteration 20, loss = 0.0028
Iteration 40, loss = 0.0033
Iteration 60, loss = 0.0071
Iteration 80, loss = 0.0040
--- Epoch 626 / 1506 - 2120 epochs total
Iteration 0, loss = 0.0063
Iteration 20, loss = 0.0133
Iteration 40, loss = 0.0055
Iteration 60, loss = 0.0046
Iteration 80, loss = 0.0054
--- Epoch 627 / 1506 - 2121 epochs total
Iteration 0, loss = 0.0032
Iteration 20, loss = 0.0020
Iteration 40, loss = 0.0019
Iteration 60, loss = 0.0028
Iteration 80, loss = 0.0027
--- Epoch 628 / 1506 - 2122 epochs total
Iteration 0, loss = 0.0058
Iteration 20, loss = 0.0054
Iteration 40, loss = 0.0023
Iteration 60, loss = 0.0033
Iteration 80, loss = 0.0063
--- Epoch 629 / 1506 - 2123 epochs total
Iteration 0, loss = 0.0022
Iteration 20, loss = 0.0048
Iteration 40, loss = 0.0062
Iteration 60, loss = 0.0064
Iteration 80, loss = 0.0034
--- Epoch 630 / 1506 - 2124 epochs total
Iteration 0, loss = 0.0037
Iteration 20, loss = 0.0032
Iteration 40, loss = 0.0045
Iteration 60, loss = 0.0024
Iteration 80, loss = 0.0029
--- Epoch 631 / 1506 - 2125 epochs total
Iteration 0, loss = 0.0022
Iteration 20, loss = 0.0091
Iteration 40, loss = 0.0040
Iteration 60, loss = 0.0039
Iteration 80, loss = 0.0041
--- Epoch 632 / 1506 - 2126 epochs total
Iteration 0, loss = 0.0049
Iteration 20, loss = 0.0060
Iteration 40, loss = 0.0023
Iteration 60, loss = 0.0043
Iteration 80, loss = 0.0055
--- Epoch 633 / 1506 - 2127 epochs total
Iteration 0, loss = 0.0042
Iteration 20, loss = 0.0062
Iteration 40, loss = 0.0051
Iteration 60, loss = 0.0042
Iteration 80, loss = 0.0053
--- Epoch 634 / 1506 - 2128 epochs total
Iteration 0, loss = 0.0091
Iteration 20, loss = 0.0026
Iteration 40, loss = 0.0031
Iteration 60, loss = 0.0019
Iteration 80, loss = 0.0080
--- Epoch 635 / 1506 - 2129 epochs total
Iteration 0, loss = 0.0049
Iteration 20, loss = 0.0034
Iteration 40, loss = 0.0013
Iteration 60, loss = 0.0035
Iteration 80, loss = 0.0040
--- Epoch 636 / 1506 - 2130 epochs total
Iteration 0, loss = 0.0030
Iteration 20, loss = 0.0078
Iteration 40, loss = 0.0035
Iteration 60, loss = 0.0026
Iteration 80, loss = 0.0071
--- Epoch 637 / 1506 - 2131 epochs total
Iteration 0, loss = 0.0024
Iteration 20, loss = 0.0021
Iteration 40, loss = 0.0114
Iteration 60, loss = 0.0013
Iteration 80, loss = 0.0037
--- Epoch 638 / 1506 - 2132 epochs total
Iteration 0, loss = 0.0044
Iteration 20, loss = 0.0093
Iteration 40, loss = 0.0075
Iteration 60, loss = 0.0093
Iteration 80, loss = 0.0071
--- Epoch 639 / 1506 - 2133 epochs total
Iteration 0, loss = 0.0029
Iteration 20, loss = 0.0019
Iteration 40, loss = 0.0028
Iteration 60, loss = 0.0033
Iteration 80, loss = 0.0036
--- Epoch 640 / 1506 - 2134 epochs total
Iteration 0, loss = 0.0017
Iteration 20, loss = 0.0027
Iteration 40, loss = 0.0039
Iteration 60, loss = 0.0095
Iteration 80, loss = 0.0046
--- Epoch 641 / 1506 - 2135 epochs total
Iteration 0, loss = 0.0030
Iteration 20, loss = 0.0023
Iteration 40, loss = 0.0043
Iteration 60, loss = 0.0071
Iteration 80, loss = 0.0052
--- Epoch 642 / 1506 - 2136 epochs total
Iteration 0, loss = 0.0033
Iteration 20, loss = 0.0019
Iteration 40, loss = 0.0031
Iteration 60, loss = 0.0041
Iteration 80, loss = 0.0046
--- Epoch 643 / 1506 - 2137 epochs total
Iteration 0, loss = 0.0023
Iteration 20, loss = 0.0025
Iteration 40, loss = 0.0021
Iteration 60, loss = 0.0028
Iteration 80, loss = 0.0029
--- Epoch 644 / 1506 - 2138 epochs total
Iteration 0, loss = 0.0049
Iteration 20, loss = 0.0051
Iteration 40, loss = 0.0037
Iteration 60, loss = 0.0038
Iteration 80, loss = 0.0020
--- Epoch 645 / 1506 - 2139 epochs total
Iteration 0, loss = 0.0019
Iteration 20, loss = 0.0064
Iteration 40, loss = 0.0044
Iteration 60, loss = 0.0026
Iteration 80, loss = 0.0017
--- Epoch 646 / 1506 - 2140 epochs total
Iteration 0, loss = 0.0023
Iteration 20, loss = 0.0027
Iteration 40, loss = 0.0022
Iteration 60, loss = 0.0036
Iteration 80, loss = 0.0196
--- Epoch 647 / 1506 - 2141 epochs total
Iteration 0, loss = 0.0021
Iteration 20, loss = 0.0048
Iteration 40, loss = 0.0122
Iteration 60, loss = 0.0034
Iteration 80, loss = 0.0030
--- Epoch 648 / 1506 - 2142 epochs total
Iteration 0, loss = 0.0062
Iteration 20, loss = 0.0029
Iteration 40, loss = 0.0017
Iteration 60, loss = 0.0048
Iteration 80, loss = 0.0058
--- Epoch 649 / 1506 - 2143 epochs total
Iteration 0, loss = 0.0223
Iteration 20, loss = 0.0055
Iteration 40, loss = 0.0022
Iteration 60, loss = 0.0049
Iteration 80, loss = 0.0050
--- Epoch 650 / 1506 - 2144 epochs total
Iteration 0, loss = 0.0080
Iteration 20, loss = 0.0033
Iteration 40, loss = 0.0053
Iteration 60, loss = 0.0032
Iteration 80, loss = 0.0042
--- Epoch 651 / 1506 - 2145 epochs total
Iteration 0, loss = 0.0029
Iteration 20, loss = 0.0016
Iteration 40, loss = 0.0203
Iteration 60, loss = 0.0042
Iteration 80, loss = 0.0035
--- Epoch 652 / 1506 - 2146 epochs total
Iteration 0, loss = 0.0039
Iteration 20, loss = 0.0040
Iteration 40, loss = 0.0016
Iteration 60, loss = 0.0035
Iteration 80, loss = 0.0104
--- Epoch 653 / 1506 - 2147 epochs total
Iteration 0, loss = 0.0156
Iteration 20, loss = 0.0018
Iteration 40, loss = 0.0044
Iteration 60, loss = 0.0038
Iteration 80, loss = 0.0039
--- Epoch 654 / 1506 - 2148 epochs total
Iteration 0, loss = 0.0043
Iteration 20, loss = 0.0028
Iteration 40, loss = 0.0039
Iteration 60, loss = 0.0044
Iteration 80, loss = 0.0015
--- Epoch 655 / 1506 - 2149 epochs total
Iteration 0, loss = 0.0185
Iteration 20, loss = 0.0051
Iteration 40, loss = 0.0040
Iteration 60, loss = 0.0024
Iteration 80, loss = 0.0030
--- Epoch 656 / 1506 - 2150 epochs total
Iteration 0, loss = 0.0016
Iteration 20, loss = 0.0026
Iteration 40, loss = 0.0032
Iteration 60, loss = 0.0044
Iteration 80, loss = 0.0036
--- Epoch 657 / 1506 - 2151 epochs total
Iteration 0, loss = 0.0040
Iteration 20, loss = 0.0049
Iteration 40, loss = 0.0065
Iteration 60, loss = 0.0035
Iteration 80, loss = 0.0103
--- Epoch 658 / 1506 - 2152 epochs total
Iteration 0, loss = 0.0055
Iteration 20, loss = 0.0060
Iteration 40, loss = 0.0038
Iteration 60, loss = 0.0029
Iteration 80, loss = 0.0043
--- Epoch 659 / 1506 - 2153 epochs total
Iteration 0, loss = 0.0053
Iteration 20, loss = 0.0022
Iteration 40, loss = 0.0092
Iteration 60, loss = 0.0019
Iteration 80, loss = 0.0217
--- Epoch 660 / 1506 - 2154 epochs total
Iteration 0, loss = 0.0090
Iteration 20, loss = 0.0047
Iteration 40, loss = 0.0036
Iteration 60, loss = 0.0026
Iteration 80, loss = 0.0031
--- Epoch 661 / 1506 - 2155 epochs total
Iteration 0, loss = 0.0025
Iteration 20, loss = 0.0031
Iteration 40, loss = 0.0041
Iteration 60, loss = 0.0072
Iteration 80, loss = 0.0039
--- Epoch 662 / 1506 - 2156 epochs total
Iteration 0, loss = 0.0072
Iteration 20, loss = 0.0034
Iteration 40, loss = 0.0026
Iteration 60, loss = 0.0061
Iteration 80, loss = 0.0039
--- Epoch 663 / 1506 - 2157 epochs total
Iteration 0, loss = 0.0022
Iteration 20, loss = 0.0053
Iteration 40, loss = 0.0021
Iteration 60, loss = 0.0033
Iteration 80, loss = 0.0032
--- Epoch 664 / 1506 - 2158 epochs total
Iteration 0, loss = 0.0040
Iteration 20, loss = 0.0029
Iteration 40, loss = 0.0023
Iteration 60, loss = 0.0030
Iteration 80, loss = 0.0025
--- Epoch 665 / 1506 - 2159 epochs total
Iteration 0, loss = 0.0036
Iteration 20, loss = 0.0043
Iteration 40, loss = 0.0058
Iteration 60, loss = 0.0042
Iteration 80, loss = 0.0041
--- Epoch 666 / 1506 - 2160 epochs total
Iteration 0, loss = 0.0019
Iteration 20, loss = 0.0028
Iteration 40, loss = 0.0106
Iteration 60, loss = 0.0072
Iteration 80, loss = 0.0031
--- Epoch 667 / 1506 - 2161 epochs total
Iteration 0, loss = 0.0029
Iteration 20, loss = 0.0025
Iteration 40, loss = 0.0025
Iteration 60, loss = 0.0074
Iteration 80, loss = 0.0109
--- Epoch 668 / 1506 - 2162 epochs total
Iteration 0, loss = 0.0024
Iteration 20, loss = 0.0025
Iteration 40, loss = 0.0041
Iteration 60, loss = 0.0022
Iteration 80, loss = 0.0032
--- Epoch 669 / 1506 - 2163 epochs total
Iteration 0, loss = 0.0144
Iteration 20, loss = 0.0077
Iteration 40, loss = 0.0039
Iteration 60, loss = 0.0046
Iteration 80, loss = 0.0052
--- Epoch 670 / 1506 - 2164 epochs total
Iteration 0, loss = 0.0083
Iteration 20, loss = 0.0028
Iteration 40, loss = 0.0065
Iteration 60, loss = 0.0073
Iteration 80, loss = 0.0043
--- Epoch 671 / 1506 - 2165 epochs total
Iteration 0, loss = 0.0041
Iteration 20, loss = 0.0091
Iteration 40, loss = 0.0023
Iteration 60, loss = 0.0043
Iteration 80, loss = 0.0059
--- Epoch 672 / 1506 - 2166 epochs total
Iteration 0, loss = 0.0136
Iteration 20, loss = 0.0074
Iteration 40, loss = 0.0030
Iteration 60, loss = 0.0085
Iteration 80, loss = 0.0084
--- Epoch 673 / 1506 - 2167 epochs total
Iteration 0, loss = 0.0026
Iteration 20, loss = 0.0047
Iteration 40, loss = 0.0021
Iteration 60, loss = 0.0032
Iteration 80, loss = 0.0048
--- Epoch 674 / 1506 - 2168 epochs total
Iteration 0, loss = 0.0027
Iteration 20, loss = 0.0015
Iteration 40, loss = 0.0106
Iteration 60, loss = 0.0070
Iteration 80, loss = 0.0019
--- Epoch 675 / 1506 - 2169 epochs total
Iteration 0, loss = 0.0092
Iteration 20, loss = 0.0024
Iteration 40, loss = 0.0058
Iteration 60, loss = 0.0020
Iteration 80, loss = 0.0046
--- Epoch 676 / 1506 - 2170 epochs total
Iteration 0, loss = 0.0040
Iteration 20, loss = 0.0096
Iteration 40, loss = 0.0076
Iteration 60, loss = 0.0041
Iteration 80, loss = 0.0049
--- Epoch 677 / 1506 - 2171 epochs total
Iteration 0, loss = 0.0071
Iteration 20, loss = 0.0032
Iteration 40, loss = 0.0028
Iteration 60, loss = 0.0036
Iteration 80, loss = 0.0040
--- Epoch 678 / 1506 - 2172 epochs total
Iteration 0, loss = 0.0054
Iteration 20, loss = 0.0018
Iteration 40, loss = 0.0080
Iteration 60, loss = 0.0023
Iteration 80, loss = 0.0066
--- Epoch 679 / 1506 - 2173 epochs total
Iteration 0, loss = 0.0040
Iteration 20, loss = 0.0081
Iteration 40, loss = 0.0020
Iteration 60, loss = 0.0023
Iteration 80, loss = 0.0064
--- Epoch 680 / 1506 - 2174 epochs total
Iteration 0, loss = 0.0098
Iteration 20, loss = 0.0018
Iteration 40, loss = 0.0069
Iteration 60, loss = 0.0032
Iteration 80, loss = 0.0122
--- Epoch 681 / 1506 - 2175 epochs total
Iteration 0, loss = 0.0031
Iteration 20, loss = 0.0019
Iteration 40, loss = 0.0033
Iteration 60, loss = 0.0055
Iteration 80, loss = 0.0062
--- Epoch 682 / 1506 - 2176 epochs total
Iteration 0, loss = 0.0087
Iteration 20, loss = 0.0035
Iteration 40, loss = 0.0032
Iteration 60, loss = 0.0029
Iteration 80, loss = 0.0042
--- Epoch 683 / 1506 - 2177 epochs total
Iteration 0, loss = 0.0037
Iteration 20, loss = 0.0010
Iteration 40, loss = 0.0035
Iteration 60, loss = 0.0035
Iteration 80, loss = 0.0055
--- Epoch 684 / 1506 - 2178 epochs total
Iteration 0, loss = 0.0024
Iteration 20, loss = 0.0029
Iteration 40, loss = 0.0044
Iteration 60, loss = 0.0063
Iteration 80, loss = 0.0072
--- Epoch 685 / 1506 - 2179 epochs total
Iteration 0, loss = 0.0046
Iteration 20, loss = 0.0035
Iteration 40, loss = 0.0034
Iteration 60, loss = 0.0039
Iteration 80, loss = 0.0026
--- Epoch 686 / 1506 - 2180 epochs total
Iteration 0, loss = 0.0021
Iteration 20, loss = 0.0120
Iteration 40, loss = 0.0036
Iteration 60, loss = 0.0059
Iteration 80, loss = 0.0079
--- Epoch 687 / 1506 - 2181 epochs total
Iteration 0, loss = 0.0035
Iteration 20, loss = 0.0045
Iteration 40, loss = 0.0037
Iteration 60, loss = 0.0018
Iteration 80, loss = 0.0122
--- Epoch 688 / 1506 - 2182 epochs total
Iteration 0, loss = 0.0072
Iteration 20, loss = 0.0025
Iteration 40, loss = 0.0050
Iteration 60, loss = 0.0022
Iteration 80, loss = 0.0038
--- Epoch 689 / 1506 - 2183 epochs total
Iteration 0, loss = 0.0049
Iteration 20, loss = 0.0059
Iteration 40, loss = 0.0037
Iteration 60, loss = 0.0032
Iteration 80, loss = 0.0034
--- Epoch 690 / 1506 - 2184 epochs total
Iteration 0, loss = 0.0041
Iteration 20, loss = 0.0042
Iteration 40, loss = 0.0017
Iteration 60, loss = 0.0035
Iteration 80, loss = 0.0021
--- Epoch 691 / 1506 - 2185 epochs total
Iteration 0, loss = 0.0029
Iteration 20, loss = 0.0253
Iteration 40, loss = 0.0077
Iteration 60, loss = 0.0066
Iteration 80, loss = 0.0061
--- Epoch 692 / 1506 - 2186 epochs total
Iteration 0, loss = 0.0061
Iteration 20, loss = 0.0025
Iteration 40, loss = 0.0029
Iteration 60, loss = 0.0078
Iteration 80, loss = 0.0049
--- Epoch 693 / 1506 - 2187 epochs total
Iteration 0, loss = 0.0049
Iteration 20, loss = 0.0017
Iteration 40, loss = 0.0041
Iteration 60, loss = 0.0070
Iteration 80, loss = 0.0074
--- Epoch 694 / 1506 - 2188 epochs total
Iteration 0, loss = 0.0254
Iteration 20, loss = 0.0040
Iteration 40, loss = 0.0268
Iteration 60, loss = 0.0071
Iteration 80, loss = 0.0040
--- Epoch 695 / 1506 - 2189 epochs total
Iteration 0, loss = 0.0030
Iteration 20, loss = 0.0027
Iteration 40, loss = 0.0028
Iteration 60, loss = 0.0018
Iteration 80, loss = 0.0024
--- Epoch 696 / 1506 - 2190 epochs total
Iteration 0, loss = 0.0041
Iteration 20, loss = 0.0038
Iteration 40, loss = 0.0027
Iteration 60, loss = 0.0032
Iteration 80, loss = 0.0028
--- Epoch 697 / 1506 - 2191 epochs total
Iteration 0, loss = 0.0028
Iteration 20, loss = 0.0019
Iteration 40, loss = 0.0021
Iteration 60, loss = 0.0052
Iteration 80, loss = 0.0033
--- Epoch 698 / 1506 - 2192 epochs total
Iteration 0, loss = 0.0027
Iteration 20, loss = 0.0037
Iteration 40, loss = 0.0025
Iteration 60, loss = 0.0058
Iteration 80, loss = 0.0023
--- Epoch 699 / 1506 - 2193 epochs total
Iteration 0, loss = 0.0018
Iteration 20, loss = 0.0041
Iteration 40, loss = 0.0060
Iteration 60, loss = 0.0036
Iteration 80, loss = 0.0078
--- Epoch 700 / 1506 - 2194 epochs total
Iteration 0, loss = 0.0022
Iteration 20, loss = 0.0044
Iteration 40, loss = 0.0031
Iteration 60, loss = 0.0028
Iteration 80, loss = 0.0045
--- Epoch 701 / 1506 - 2195 epochs total
Iteration 0, loss = 0.0040
Iteration 20, loss = 0.0024
Iteration 40, loss = 0.0032
Iteration 60, loss = 0.0026
Iteration 80, loss = 0.0054
--- Epoch 702 / 1506 - 2196 epochs total
Iteration 0, loss = 0.0057
Iteration 20, loss = 0.0102
Iteration 40, loss = 0.0027
Iteration 60, loss = 0.0026
Iteration 80, loss = 0.0019
--- Epoch 703 / 1506 - 2197 epochs total
Iteration 0, loss = 0.0068
Iteration 20, loss = 0.0026
Iteration 40, loss = 0.0136
Iteration 60, loss = 0.0061
Iteration 80, loss = 0.0019
--- Epoch 704 / 1506 - 2198 epochs total
Iteration 0, loss = 0.0039
Iteration 20, loss = 0.0054
Iteration 40, loss = 0.0028
Iteration 60, loss = 0.0038
Iteration 80, loss = 0.0014
--- Epoch 705 / 1506 - 2199 epochs total
Iteration 0, loss = 0.0038
Iteration 20, loss = 0.0031
Iteration 40, loss = 0.0037
Iteration 60, loss = 0.0119
Iteration 80, loss = 0.0016
--- Epoch 706 / 1506 - 2200 epochs total
Iteration 0, loss = 0.0049
Iteration 20, loss = 0.0055
Iteration 40, loss = 0.0060
Iteration 60, loss = 0.0053
Iteration 80, loss = 0.0049
--- Epoch 707 / 1506 - 2201 epochs total
Iteration 0, loss = 0.0059
Iteration 20, loss = 0.0035
Iteration 40, loss = 0.0044
Iteration 60, loss = 0.0193
Iteration 80, loss = 0.0206
--- Epoch 708 / 1506 - 2202 epochs total
Iteration 0, loss = 0.0090
Iteration 20, loss = 0.0045
Iteration 40, loss = 0.0033
Iteration 60, loss = 0.0040
Iteration 80, loss = 0.0036
--- Epoch 709 / 1506 - 2203 epochs total
Iteration 0, loss = 0.0063
Iteration 20, loss = 0.0106
Iteration 40, loss = 0.0032
Iteration 60, loss = 0.0043
Iteration 80, loss = 0.0025
--- Epoch 710 / 1506 - 2204 epochs total
Iteration 0, loss = 0.0040
Iteration 20, loss = 0.0042
Iteration 40, loss = 0.0058
Iteration 60, loss = 0.0141
Iteration 80, loss = 0.0069
--- Epoch 711 / 1506 - 2205 epochs total
Iteration 0, loss = 0.0074
Iteration 20, loss = 0.0035
Iteration 40, loss = 0.0028
Iteration 60, loss = 0.0048
Iteration 80, loss = 0.0037
--- Epoch 712 / 1506 - 2206 epochs total
Iteration 0, loss = 0.0058
Iteration 20, loss = 0.0087
Iteration 40, loss = 0.0082
Iteration 60, loss = 0.0046
Iteration 80, loss = 0.0038
--- Epoch 713 / 1506 - 2207 epochs total
Iteration 0, loss = 0.0040
Iteration 20, loss = 0.0037
Iteration 40, loss = 0.0019
Iteration 60, loss = 0.0020
Iteration 80, loss = 0.0041
--- Epoch 714 / 1506 - 2208 epochs total
Iteration 0, loss = 0.0043
Iteration 20, loss = 0.0047
Iteration 40, loss = 0.0033
Iteration 60, loss = 0.0043
Iteration 80, loss = 0.0073
--- Epoch 715 / 1506 - 2209 epochs total
Iteration 0, loss = 0.0045
Iteration 20, loss = 0.0038
Iteration 40, loss = 0.0025
Iteration 60, loss = 0.0035
Iteration 80, loss = 0.0064
--- Epoch 716 / 1506 - 2210 epochs total
Iteration 0, loss = 0.0041
Iteration 20, loss = 0.0022
Iteration 40, loss = 0.0024
Iteration 60, loss = 0.0029
Iteration 80, loss = 0.0082
--- Epoch 717 / 1506 - 2211 epochs total
Iteration 0, loss = 0.0035
Iteration 20, loss = 0.0026
Iteration 40, loss = 0.0036
Iteration 60, loss = 0.0033
Iteration 80, loss = 0.0029
--- Epoch 718 / 1506 - 2212 epochs total
Iteration 0, loss = 0.0017
Iteration 20, loss = 0.0133
Iteration 40, loss = 0.0030
Iteration 60, loss = 0.0030
Iteration 80, loss = 0.0052
--- Epoch 719 / 1506 - 2213 epochs total
Iteration 0, loss = 0.0043
Iteration 20, loss = 0.0178
Iteration 40, loss = 0.0040
Iteration 60, loss = 0.0029
Iteration 80, loss = 0.0036
--- Epoch 720 / 1506 - 2214 epochs total
Iteration 0, loss = 0.0024
Iteration 20, loss = 0.0055
Iteration 40, loss = 0.0029
Iteration 60, loss = 0.0019
Iteration 80, loss = 0.0067
--- Epoch 721 / 1506 - 2215 epochs total
Iteration 0, loss = 0.0056
Iteration 20, loss = 0.0021
Iteration 40, loss = 0.0035
Iteration 60, loss = 0.0041
Iteration 80, loss = 0.0031
--- Epoch 722 / 1506 - 2216 epochs total
Iteration 0, loss = 0.0025
Iteration 20, loss = 0.0154
Iteration 40, loss = 0.0049
Iteration 60, loss = 0.0044
Iteration 80, loss = 0.0028
--- Epoch 723 / 1506 - 2217 epochs total
Iteration 0, loss = 0.0085
Iteration 20, loss = 0.0019
Iteration 40, loss = 0.0036
Iteration 60, loss = 0.0053
Iteration 80, loss = 0.0038
--- Epoch 724 / 1506 - 2218 epochs total
Iteration 0, loss = 0.0025
Iteration 20, loss = 0.0025
Iteration 40, loss = 0.0159
Iteration 60, loss = 0.0051
Iteration 80, loss = 0.0059
--- Epoch 725 / 1506 - 2219 epochs total
Iteration 0, loss = 0.0024
Iteration 20, loss = 0.0066
Iteration 40, loss = 0.0017
Iteration 60, loss = 0.0018
Iteration 80, loss = 0.0059
--- Epoch 726 / 1506 - 2220 epochs total
Iteration 0, loss = 0.0073
Iteration 20, loss = 0.0130
Iteration 40, loss = 0.0184
Iteration 60, loss = 0.0107
Iteration 80, loss = 0.0013
--- Epoch 727 / 1506 - 2221 epochs total
Iteration 0, loss = 0.0041
Iteration 20, loss = 0.0040
Iteration 40, loss = 0.0052
Iteration 60, loss = 0.0040
Iteration 80, loss = 0.0032
--- Epoch 728 / 1506 - 2222 epochs total
Iteration 0, loss = 0.0018
Iteration 20, loss = 0.0050
Iteration 40, loss = 0.0054
Iteration 60, loss = 0.0067
Iteration 80, loss = 0.0082
--- Epoch 729 / 1506 - 2223 epochs total
Iteration 0, loss = 0.0022
Iteration 20, loss = 0.0086
Iteration 40, loss = 0.0038
Iteration 60, loss = 0.0032
Iteration 80, loss = 0.0042
--- Epoch 730 / 1506 - 2224 epochs total
Iteration 0, loss = 0.0016
Iteration 20, loss = 0.0024
Iteration 40, loss = 0.0035
Iteration 60, loss = 0.0080
Iteration 80, loss = 0.0036
--- Epoch 731 / 1506 - 2225 epochs total
Iteration 0, loss = 0.0098
Iteration 20, loss = 0.0017
Iteration 40, loss = 0.0284
Iteration 60, loss = 0.0065
Iteration 80, loss = 0.0043
--- Epoch 732 / 1506 - 2226 epochs total
Iteration 0, loss = 0.0044
Iteration 20, loss = 0.0090
Iteration 40, loss = 0.0038
Iteration 60, loss = 0.0043
Iteration 80, loss = 0.0035
--- Epoch 733 / 1506 - 2227 epochs total
Iteration 0, loss = 0.0094
Iteration 20, loss = 0.0023
Iteration 40, loss = 0.0028
Iteration 60, loss = 0.0059
Iteration 80, loss = 0.0036
--- Epoch 734 / 1506 - 2228 epochs total
Iteration 0, loss = 0.0027
Iteration 20, loss = 0.0031
Iteration 40, loss = 0.0067
Iteration 60, loss = 0.0040
Iteration 80, loss = 0.0027
--- Epoch 735 / 1506 - 2229 epochs total
Iteration 0, loss = 0.0024
Iteration 20, loss = 0.0047
Iteration 40, loss = 0.0046
Iteration 60, loss = 0.0043
Iteration 80, loss = 0.0041
--- Epoch 736 / 1506 - 2230 epochs total
Iteration 0, loss = 0.0040
Iteration 20, loss = 0.0035
Iteration 40, loss = 0.0026
Iteration 60, loss = 0.0028
Iteration 80, loss = 0.0064
--- Epoch 737 / 1506 - 2231 epochs total
Iteration 0, loss = 0.0026
Iteration 20, loss = 0.0025
Iteration 40, loss = 0.0054
Iteration 60, loss = 0.0050
Iteration 80, loss = 0.0035
--- Epoch 738 / 1506 - 2232 epochs total
Iteration 0, loss = 0.0020
Iteration 20, loss = 0.0056
Iteration 40, loss = 0.0028
Iteration 60, loss = 0.0010
Iteration 80, loss = 0.0041
--- Epoch 739 / 1506 - 2233 epochs total
Iteration 0, loss = 0.0034
Iteration 20, loss = 0.0043
Iteration 40, loss = 0.0074
Iteration 60, loss = 0.0020
Iteration 80, loss = 0.0032
--- Epoch 740 / 1506 - 2234 epochs total
Iteration 0, loss = 0.0043
Iteration 20, loss = 0.0075
Iteration 40, loss = 0.0079
Iteration 60, loss = 0.0047
Iteration 80, loss = 0.0027
--- Epoch 741 / 1506 - 2235 epochs total
Iteration 0, loss = 0.0034
Iteration 20, loss = 0.0039
Iteration 40, loss = 0.0080
Iteration 60, loss = 0.0031
Iteration 80, loss = 0.0030
--- Epoch 742 / 1506 - 2236 epochs total
Iteration 0, loss = 0.0018
Iteration 20, loss = 0.0025
Iteration 40, loss = 0.0037
Iteration 60, loss = 0.0053
Iteration 80, loss = 0.0077
--- Epoch 743 / 1506 - 2237 epochs total
Iteration 0, loss = 0.0030
Iteration 20, loss = 0.0023
Iteration 40, loss = 0.0019
Iteration 60, loss = 0.0096
Iteration 80, loss = 0.0046
--- Epoch 744 / 1506 - 2238 epochs total
Iteration 0, loss = 0.0051
Iteration 20, loss = 0.0064
Iteration 40, loss = 0.0059
Iteration 60, loss = 0.0033
Iteration 80, loss = 0.0045
--- Epoch 745 / 1506 - 2239 epochs total
Iteration 0, loss = 0.0030
Iteration 20, loss = 0.0026
Iteration 40, loss = 0.0039
Iteration 60, loss = 0.0025
Iteration 80, loss = 0.0025
--- Epoch 746 / 1506 - 2240 epochs total
Iteration 0, loss = 0.0093
Iteration 20, loss = 0.0083
Iteration 40, loss = 0.0053
Iteration 60, loss = 0.0029
Iteration 80, loss = 0.0025
--- Epoch 747 / 1506 - 2241 epochs total
Iteration 0, loss = 0.0032
Iteration 20, loss = 0.0020
Iteration 40, loss = 0.0045
Iteration 60, loss = 0.0043
Iteration 80, loss = 0.0023
--- Epoch 748 / 1506 - 2242 epochs total
Iteration 0, loss = 0.0026
Iteration 20, loss = 0.0018
Iteration 40, loss = 0.0084
Iteration 60, loss = 0.0045
Iteration 80, loss = 0.0035
--- Epoch 749 / 1506 - 2243 epochs total
Iteration 0, loss = 0.0047
Iteration 20, loss = 0.0035
Iteration 40, loss = 0.0036
Iteration 60, loss = 0.0036
Iteration 80, loss = 0.0025
--- Epoch 750 / 1506 - 2244 epochs total
Iteration 0, loss = 0.0064
Iteration 20, loss = 0.0028
Iteration 40, loss = 0.0020
Iteration 60, loss = 0.0038
Iteration 80, loss = 0.0047
--- Epoch 751 / 1506 - 2245 epochs total
Iteration 0, loss = 0.0055
Iteration 20, loss = 0.0038
Iteration 40, loss = 0.0055
Iteration 60, loss = 0.0016
Iteration 80, loss = 0.0095
--- Epoch 752 / 1506 - 2246 epochs total
Iteration 0, loss = 0.0039
Iteration 20, loss = 0.0050
Iteration 40, loss = 0.0117
Iteration 60, loss = 0.0052
Iteration 80, loss = 0.0018
--- Epoch 753 / 1506 - 2247 epochs total
Iteration 0, loss = 0.0031
Iteration 20, loss = 0.0200
Iteration 40, loss = 0.0019
Iteration 60, loss = 0.0065
Iteration 80, loss = 0.0024
--- Epoch 754 / 1506 - 2248 epochs total
Iteration 0, loss = 0.0051
Iteration 20, loss = 0.0022
Iteration 40, loss = 0.0018
Iteration 60, loss = 0.0060
Iteration 80, loss = 0.0024
--- Epoch 755 / 1506 - 2249 epochs total
Iteration 0, loss = 0.0041
Iteration 20, loss = 0.0028
Iteration 40, loss = 0.0044
Iteration 60, loss = 0.0060
Iteration 80, loss = 0.0034
--- Epoch 756 / 1506 - 2250 epochs total
Iteration 0, loss = 0.0036
Iteration 20, loss = 0.0072
Iteration 40, loss = 0.0154
Iteration 60, loss = 0.0011
Iteration 80, loss = 0.0027
--- Epoch 757 / 1506 - 2251 epochs total
Iteration 0, loss = 0.0111
Iteration 20, loss = 0.0076
Iteration 40, loss = 0.0035
Iteration 60, loss = 0.0060
Iteration 80, loss = 0.0075
--- Epoch 758 / 1506 - 2252 epochs total
Iteration 0, loss = 0.0030
Iteration 20, loss = 0.0040
Iteration 40, loss = 0.0042
Iteration 60, loss = 0.0029
Iteration 80, loss = 0.0040
--- Epoch 759 / 1506 - 2253 epochs total
Iteration 0, loss = 0.0039
Iteration 20, loss = 0.0037
Iteration 40, loss = 0.0137
Iteration 60, loss = 0.0031
Iteration 80, loss = 0.0076
--- Epoch 760 / 1506 - 2254 epochs total
Iteration 0, loss = 0.0040
Iteration 20, loss = 0.0025
Iteration 40, loss = 0.0140
Iteration 60, loss = 0.0017
Iteration 80, loss = 0.0039
--- Epoch 761 / 1506 - 2255 epochs total
Iteration 0, loss = 0.0116
Iteration 20, loss = 0.0021
Iteration 40, loss = 0.0046
Iteration 60, loss = 0.0043
Iteration 80, loss = 0.0015
--- Epoch 762 / 1506 - 2256 epochs total
Iteration 0, loss = 0.0022
Iteration 20, loss = 0.0031
Iteration 40, loss = 0.0184
Iteration 60, loss = 0.0055
Iteration 80, loss = 0.0053
--- Epoch 763 / 1506 - 2257 epochs total
Iteration 0, loss = 0.0024
Iteration 20, loss = 0.0179
Iteration 40, loss = 0.0065
Iteration 60, loss = 0.0038
Iteration 80, loss = 0.0028
--- Epoch 764 / 1506 - 2258 epochs total
Iteration 0, loss = 0.0024
Iteration 20, loss = 0.0027
Iteration 40, loss = 0.0036
Iteration 60, loss = 0.0037
Iteration 80, loss = 0.0040
--- Epoch 765 / 1506 - 2259 epochs total
Iteration 0, loss = 0.0037
Iteration 20, loss = 0.0082
Iteration 40, loss = 0.0013
Iteration 60, loss = 0.0035
Iteration 80, loss = 0.0046
--- Epoch 766 / 1506 - 2260 epochs total
Iteration 0, loss = 0.0022
Iteration 20, loss = 0.0053
Iteration 40, loss = 0.0044
Iteration 60, loss = 0.0030
Iteration 80, loss = 0.0056
--- Epoch 767 / 1506 - 2261 epochs total
Iteration 0, loss = 0.0041
Iteration 20, loss = 0.0026
Iteration 40, loss = 0.0031
Iteration 60, loss = 0.0027
Iteration 80, loss = 0.0024
--- Epoch 768 / 1506 - 2262 epochs total
Iteration 0, loss = 0.0061
Iteration 20, loss = 0.0032
Iteration 40, loss = 0.0068
Iteration 60, loss = 0.0070
Iteration 80, loss = 0.0054
--- Epoch 769 / 1506 - 2263 epochs total
Iteration 0, loss = 0.0079
Iteration 20, loss = 0.0091
Iteration 40, loss = 0.0029
Iteration 60, loss = 0.0030
Iteration 80, loss = 0.0027
--- Epoch 770 / 1506 - 2264 epochs total
Iteration 0, loss = 0.0040
Iteration 20, loss = 0.0026
Iteration 40, loss = 0.0039
Iteration 60, loss = 0.0039
Iteration 80, loss = 0.0035
--- Epoch 771 / 1506 - 2265 epochs total
Iteration 0, loss = 0.0034
Iteration 20, loss = 0.0046
Iteration 40, loss = 0.0016
Iteration 60, loss = 0.0078
Iteration 80, loss = 0.0021
--- Epoch 772 / 1506 - 2266 epochs total
Iteration 0, loss = 0.0020
Iteration 20, loss = 0.0018
Iteration 40, loss = 0.0042
Iteration 60, loss = 0.0024
Iteration 80, loss = 0.0039
--- Epoch 773 / 1506 - 2267 epochs total
Iteration 0, loss = 0.0039
Iteration 20, loss = 0.0056
Iteration 40, loss = 0.0221
Iteration 60, loss = 0.0052
Iteration 80, loss = 0.0035
--- Epoch 774 / 1506 - 2268 epochs total
Iteration 0, loss = 0.0065
Iteration 20, loss = 0.0025
Iteration 40, loss = 0.0046
Iteration 60, loss = 0.0043
Iteration 80, loss = 0.0035
--- Epoch 775 / 1506 - 2269 epochs total
Iteration 0, loss = 0.0012
Iteration 20, loss = 0.0051
Iteration 40, loss = 0.0055
Iteration 60, loss = 0.0027
Iteration 80, loss = 0.0051
--- Epoch 776 / 1506 - 2270 epochs total
Iteration 0, loss = 0.0043
Iteration 20, loss = 0.0024
Iteration 40, loss = 0.0082
Iteration 60, loss = 0.0061
Iteration 80, loss = 0.0088
--- Epoch 777 / 1506 - 2271 epochs total
Iteration 0, loss = 0.0011
Iteration 20, loss = 0.0038
Iteration 40, loss = 0.0033
Iteration 60, loss = 0.0022
Iteration 80, loss = 0.0159
--- Epoch 778 / 1506 - 2272 epochs total
Iteration 0, loss = 0.0037
Iteration 20, loss = 0.0035
Iteration 40, loss = 0.0074
Iteration 60, loss = 0.0087
Iteration 80, loss = 0.0057
--- Epoch 779 / 1506 - 2273 epochs total
Iteration 0, loss = 0.0035
Iteration 20, loss = 0.0026
Iteration 40, loss = 0.0065
Iteration 60, loss = 0.0035
Iteration 80, loss = 0.0048
--- Epoch 780 / 1506 - 2274 epochs total
Iteration 0, loss = 0.0069
Iteration 20, loss = 0.0082
Iteration 40, loss = 0.0032
Iteration 60, loss = 0.0072
Iteration 80, loss = 0.0032
--- Epoch 781 / 1506 - 2275 epochs total
Iteration 0, loss = 0.0028
Iteration 20, loss = 0.0254
Iteration 40, loss = 0.0040
Iteration 60, loss = 0.0068
Iteration 80, loss = 0.0223
--- Epoch 782 / 1506 - 2276 epochs total
Iteration 0, loss = 0.0067
Iteration 20, loss = 0.0030
Iteration 40, loss = 0.0032
Iteration 60, loss = 0.0071
Iteration 80, loss = 0.0072
--- Epoch 783 / 1506 - 2277 epochs total
Iteration 0, loss = 0.0037
Iteration 20, loss = 0.0036
Iteration 40, loss = 0.0033
Iteration 60, loss = 0.0057
Iteration 80, loss = 0.0018
--- Epoch 784 / 1506 - 2278 epochs total
Iteration 0, loss = 0.0117
Iteration 20, loss = 0.0041
Iteration 40, loss = 0.0043
Iteration 60, loss = 0.0029
Iteration 80, loss = 0.0037
--- Epoch 785 / 1506 - 2279 epochs total
Iteration 0, loss = 0.0024
Iteration 20, loss = 0.0020
Iteration 40, loss = 0.0055
Iteration 60, loss = 0.0064
Iteration 80, loss = 0.0037
--- Epoch 786 / 1506 - 2280 epochs total
Iteration 0, loss = 0.0141
Iteration 20, loss = 0.0053
Iteration 40, loss = 0.0086
Iteration 60, loss = 0.0093
Iteration 80, loss = 0.0043
--- Epoch 787 / 1506 - 2281 epochs total
Iteration 0, loss = 0.0089
Iteration 20, loss = 0.0032
Iteration 40, loss = 0.0028
Iteration 60, loss = 0.0022
Iteration 80, loss = 0.0097
--- Epoch 788 / 1506 - 2282 epochs total
Iteration 0, loss = 0.0076
Iteration 20, loss = 0.0051
Iteration 40, loss = 0.0051
Iteration 60, loss = 0.0011
Iteration 80, loss = 0.0035
--- Epoch 789 / 1506 - 2283 epochs total
Iteration 0, loss = 0.0051
Iteration 20, loss = 0.0029
Iteration 40, loss = 0.0086
Iteration 60, loss = 0.0030
Iteration 80, loss = 0.0053
--- Epoch 790 / 1506 - 2284 epochs total
Iteration 0, loss = 0.0178
Iteration 20, loss = 0.0038
Iteration 40, loss = 0.0020
Iteration 60, loss = 0.0029
Iteration 80, loss = 0.0172
--- Epoch 791 / 1506 - 2285 epochs total
Iteration 0, loss = 0.0053
Iteration 20, loss = 0.0055
Iteration 40, loss = 0.0054
Iteration 60, loss = 0.0038
Iteration 80, loss = 0.0057
--- Epoch 792 / 1506 - 2286 epochs total
Iteration 0, loss = 0.0025
Iteration 20, loss = 0.0044
Iteration 40, loss = 0.0024
Iteration 60, loss = 0.0026
Iteration 80, loss = 0.0028
--- Epoch 793 / 1506 - 2287 epochs total
Iteration 0, loss = 0.0047
Iteration 20, loss = 0.0019
Iteration 40, loss = 0.0024
Iteration 60, loss = 0.0047
Iteration 80, loss = 0.0054
--- Epoch 794 / 1506 - 2288 epochs total
Iteration 0, loss = 0.0060
Iteration 20, loss = 0.0032
Iteration 40, loss = 0.0029
Iteration 60, loss = 0.0031
Iteration 80, loss = 0.0049
--- Epoch 795 / 1506 - 2289 epochs total
Iteration 0, loss = 0.0032
Iteration 20, loss = 0.0025
Iteration 40, loss = 0.0043
Iteration 60, loss = 0.0038
Iteration 80, loss = 0.0031
--- Epoch 796 / 1506 - 2290 epochs total
Iteration 0, loss = 0.0052
Iteration 20, loss = 0.0035
Iteration 40, loss = 0.0048
Iteration 60, loss = 0.0038
Iteration 80, loss = 0.0047
--- Epoch 797 / 1506 - 2291 epochs total
Iteration 0, loss = 0.0049
Iteration 20, loss = 0.0032
Iteration 40, loss = 0.0089
Iteration 60, loss = 0.0138
Iteration 80, loss = 0.0059
--- Epoch 798 / 1506 - 2292 epochs total
Iteration 0, loss = 0.0051
Iteration 20, loss = 0.0063
Iteration 40, loss = 0.0064
Iteration 60, loss = 0.0044
Iteration 80, loss = 0.0013
--- Epoch 799 / 1506 - 2293 epochs total
Iteration 0, loss = 0.0020
Iteration 20, loss = 0.0059
Iteration 40, loss = 0.0043
Iteration 60, loss = 0.0040
Iteration 80, loss = 0.0044
--- Epoch 800 / 1506 - 2294 epochs total
Iteration 0, loss = 0.0035
Iteration 20, loss = 0.0027
Iteration 40, loss = 0.0024
Iteration 60, loss = 0.0023
Iteration 80, loss = 0.0039
--- Epoch 801 / 1506 - 2295 epochs total
Iteration 0, loss = 0.0087
Iteration 20, loss = 0.0084
Iteration 40, loss = 0.0026
Iteration 60, loss = 0.0031
Iteration 80, loss = 0.0061
--- Epoch 802 / 1506 - 2296 epochs total
Iteration 0, loss = 0.0031
Iteration 20, loss = 0.0067
Iteration 40, loss = 0.0042
Iteration 60, loss = 0.0036
Iteration 80, loss = 0.0039
--- Epoch 803 / 1506 - 2297 epochs total
Iteration 0, loss = 0.0048
Iteration 20, loss = 0.0047
Iteration 40, loss = 0.0071
Iteration 60, loss = 0.0071
Iteration 80, loss = 0.0034
--- Epoch 804 / 1506 - 2298 epochs total
Iteration 0, loss = 0.0040
Iteration 20, loss = 0.0041
Iteration 40, loss = 0.0020
Iteration 60, loss = 0.0096
Iteration 80, loss = 0.0029
--- Epoch 805 / 1506 - 2299 epochs total
Iteration 0, loss = 0.0016
Iteration 20, loss = 0.0035
Iteration 40, loss = 0.0023
Iteration 60, loss = 0.0025
Iteration 80, loss = 0.0021
--- Epoch 806 / 1506 - 2300 epochs total
Iteration 0, loss = 0.0059
Iteration 20, loss = 0.0037
Iteration 40, loss = 0.0021
Iteration 60, loss = 0.0020
Iteration 80, loss = 0.0021
--- Epoch 807 / 1506 - 2301 epochs total
Iteration 0, loss = 0.0024
Iteration 20, loss = 0.0050
Iteration 40, loss = 0.0119
Iteration 60, loss = 0.0032
Iteration 80, loss = 0.0030
--- Epoch 808 / 1506 - 2302 epochs total
Iteration 0, loss = 0.0032
Iteration 20, loss = 0.0045
Iteration 40, loss = 0.0028
Iteration 60, loss = 0.0052
Iteration 80, loss = 0.0035
--- Epoch 809 / 1506 - 2303 epochs total
Iteration 0, loss = 0.0043
Iteration 20, loss = 0.0026
Iteration 40, loss = 0.0031
Iteration 60, loss = 0.0046
Iteration 80, loss = 0.0023
--- Epoch 810 / 1506 - 2304 epochs total
Iteration 0, loss = 0.0030
Iteration 20, loss = 0.0027
Iteration 40, loss = 0.0049
Iteration 60, loss = 0.0079
Iteration 80, loss = 0.0032
--- Epoch 811 / 1506 - 2305 epochs total
Iteration 0, loss = 0.0023
Iteration 20, loss = 0.0024
Iteration 40, loss = 0.0138
Iteration 60, loss = 0.0038
Iteration 80, loss = 0.0032
--- Epoch 812 / 1506 - 2306 epochs total
Iteration 0, loss = 0.0040
Iteration 20, loss = 0.0106
Iteration 40, loss = 0.0082
Iteration 60, loss = 0.0034
Iteration 80, loss = 0.0045
--- Epoch 813 / 1506 - 2307 epochs total
Iteration 0, loss = 0.0049
Iteration 20, loss = 0.0051
Iteration 40, loss = 0.0025
Iteration 60, loss = 0.0023
Iteration 80, loss = 0.0053
--- Epoch 814 / 1506 - 2308 epochs total
Iteration 0, loss = 0.0042
Iteration 20, loss = 0.0022
Iteration 40, loss = 0.0057
Iteration 60, loss = 0.0059
Iteration 80, loss = 0.0023
--- Epoch 815 / 1506 - 2309 epochs total
Iteration 0, loss = 0.0016
Iteration 20, loss = 0.0050
Iteration 40, loss = 0.0027
Iteration 60, loss = 0.0143
Iteration 80, loss = 0.0052
--- Epoch 816 / 1506 - 2310 epochs total
Iteration 0, loss = 0.0066
Iteration 20, loss = 0.0159
Iteration 40, loss = 0.0022
Iteration 60, loss = 0.0060
Iteration 80, loss = 0.0075
--- Epoch 817 / 1506 - 2311 epochs total
Iteration 0, loss = 0.0050
Iteration 20, loss = 0.0031
Iteration 40, loss = 0.0066
Iteration 60, loss = 0.0063
Iteration 80, loss = 0.0053
--- Epoch 818 / 1506 - 2312 epochs total
Iteration 0, loss = 0.0040
Iteration 20, loss = 0.0027
Iteration 40, loss = 0.0016
Iteration 60, loss = 0.0123
Iteration 80, loss = 0.0028
--- Epoch 819 / 1506 - 2313 epochs total
Iteration 0, loss = 0.0055
Iteration 20, loss = 0.0018
Iteration 40, loss = 0.0037
Iteration 60, loss = 0.0035
Iteration 80, loss = 0.0072
--- Epoch 820 / 1506 - 2314 epochs total
Iteration 0, loss = 0.0020
Iteration 20, loss = 0.0051
Iteration 40, loss = 0.0016
Iteration 60, loss = 0.0035
Iteration 80, loss = 0.0043
--- Epoch 821 / 1506 - 2315 epochs total
Iteration 0, loss = 0.0045
Iteration 20, loss = 0.0030
Iteration 40, loss = 0.0037
Iteration 60, loss = 0.0043
Iteration 80, loss = 0.0119
--- Epoch 822 / 1506 - 2316 epochs total
Iteration 0, loss = 0.0031
Iteration 20, loss = 0.0062
Iteration 40, loss = 0.0033
Iteration 60, loss = 0.0071
Iteration 80, loss = 0.0067
--- Epoch 823 / 1506 - 2317 epochs total
Iteration 0, loss = 0.0021
Iteration 20, loss = 0.0038
Iteration 40, loss = 0.0052
Iteration 60, loss = 0.0043
Iteration 80, loss = 0.0189
--- Epoch 824 / 1506 - 2318 epochs total
Iteration 0, loss = 0.0066
Iteration 20, loss = 0.0021
Iteration 40, loss = 0.0022
Iteration 60, loss = 0.0030
Iteration 80, loss = 0.0025
--- Epoch 825 / 1506 - 2319 epochs total
Iteration 0, loss = 0.0036
Iteration 20, loss = 0.0030
Iteration 40, loss = 0.0037
Iteration 60, loss = 0.0030
Iteration 80, loss = 0.0041
--- Epoch 826 / 1506 - 2320 epochs total
Iteration 0, loss = 0.0027
Iteration 20, loss = 0.0030
Iteration 40, loss = 0.0023
Iteration 60, loss = 0.0041
Iteration 80, loss = 0.0026
--- Epoch 827 / 1506 - 2321 epochs total
Iteration 0, loss = 0.0114
Iteration 20, loss = 0.0025
Iteration 40, loss = 0.0081
Iteration 60, loss = 0.0037
Iteration 80, loss = 0.0086
--- Epoch 828 / 1506 - 2322 epochs total
Iteration 0, loss = 0.0021
Iteration 20, loss = 0.0037
Iteration 40, loss = 0.0041
Iteration 60, loss = 0.0030
Iteration 80, loss = 0.0082
--- Epoch 829 / 1506 - 2323 epochs total
Iteration 0, loss = 0.0088
Iteration 20, loss = 0.0045
Iteration 40, loss = 0.0035
Iteration 60, loss = 0.0180
Iteration 80, loss = 0.0028
--- Epoch 830 / 1506 - 2324 epochs total
Iteration 0, loss = 0.0041
Iteration 20, loss = 0.0046
Iteration 40, loss = 0.0060
Iteration 60, loss = 0.0226
Iteration 80, loss = 0.0020
--- Epoch 831 / 1506 - 2325 epochs total
Iteration 0, loss = 0.0056
Iteration 20, loss = 0.0029
Iteration 40, loss = 0.0082
Iteration 60, loss = 0.0048
Iteration 80, loss = 0.0030
--- Epoch 832 / 1506 - 2326 epochs total
Iteration 0, loss = 0.0028
Iteration 20, loss = 0.0052
Iteration 40, loss = 0.0019
Iteration 60, loss = 0.0060
Iteration 80, loss = 0.0059
--- Epoch 833 / 1506 - 2327 epochs total
Iteration 0, loss = 0.0038
Iteration 20, loss = 0.0126
Iteration 40, loss = 0.0048
Iteration 60, loss = 0.0020
Iteration 80, loss = 0.0116
--- Epoch 834 / 1506 - 2328 epochs total
Iteration 0, loss = 0.0027
Iteration 20, loss = 0.0019
Iteration 40, loss = 0.0018
Iteration 60, loss = 0.0119
Iteration 80, loss = 0.0222
--- Epoch 835 / 1506 - 2329 epochs total
Iteration 0, loss = 0.0049
Iteration 20, loss = 0.0026
Iteration 40, loss = 0.0020
Iteration 60, loss = 0.0024
Iteration 80, loss = 0.0019
--- Epoch 836 / 1506 - 2330 epochs total
Iteration 0, loss = 0.0059
Iteration 20, loss = 0.0049
Iteration 40, loss = 0.0019
Iteration 60, loss = 0.0039
Iteration 80, loss = 0.0128
--- Epoch 837 / 1506 - 2331 epochs total
Iteration 0, loss = 0.0087
Iteration 20, loss = 0.0049
Iteration 40, loss = 0.0031
Iteration 60, loss = 0.0032
Iteration 80, loss = 0.0037
--- Epoch 838 / 1506 - 2332 epochs total
Iteration 0, loss = 0.0062
Iteration 20, loss = 0.0030
Iteration 40, loss = 0.0027
Iteration 60, loss = 0.0083
Iteration 80, loss = 0.0038
--- Epoch 839 / 1506 - 2333 epochs total
Iteration 0, loss = 0.0042
Iteration 20, loss = 0.0025
Iteration 40, loss = 0.0039
Iteration 60, loss = 0.0028
Iteration 80, loss = 0.0023
--- Epoch 840 / 1506 - 2334 epochs total
Iteration 0, loss = 0.0032
Iteration 20, loss = 0.0018
Iteration 40, loss = 0.0028
Iteration 60, loss = 0.0043
Iteration 80, loss = 0.0082
--- Epoch 841 / 1506 - 2335 epochs total
Iteration 0, loss = 0.0021
Iteration 20, loss = 0.0026
Iteration 40, loss = 0.0067
Iteration 60, loss = 0.0025
Iteration 80, loss = 0.0043
--- Epoch 842 / 1506 - 2336 epochs total
Iteration 0, loss = 0.0026
Iteration 20, loss = 0.0026
Iteration 40, loss = 0.0028
Iteration 60, loss = 0.0025
Iteration 80, loss = 0.0054
--- Epoch 843 / 1506 - 2337 epochs total
Iteration 0, loss = 0.0081
Iteration 20, loss = 0.0031
Iteration 40, loss = 0.0022
Iteration 60, loss = 0.0015
Iteration 80, loss = 0.0030
--- Epoch 844 / 1506 - 2338 epochs total
Iteration 0, loss = 0.0025
Iteration 20, loss = 0.0024
Iteration 40, loss = 0.0022
Iteration 60, loss = 0.0191
Iteration 80, loss = 0.0067
--- Epoch 845 / 1506 - 2339 epochs total
Iteration 0, loss = 0.0119
Iteration 20, loss = 0.0058
Iteration 40, loss = 0.0033
Iteration 60, loss = 0.0039
Iteration 80, loss = 0.0040
--- Epoch 846 / 1506 - 2340 epochs total
Iteration 0, loss = 0.0033
Iteration 20, loss = 0.0037
Iteration 40, loss = 0.0044
Iteration 60, loss = 0.0026
Iteration 80, loss = 0.0036
--- Epoch 847 / 1506 - 2341 epochs total
Iteration 0, loss = 0.0021
Iteration 20, loss = 0.0080
Iteration 40, loss = 0.0057
Iteration 60, loss = 0.0022
Iteration 80, loss = 0.0042
--- Epoch 848 / 1506 - 2342 epochs total
Iteration 0, loss = 0.0032
Iteration 20, loss = 0.0028
Iteration 40, loss = 0.0042
Iteration 60, loss = 0.0033
Iteration 80, loss = 0.0045
--- Epoch 849 / 1506 - 2343 epochs total
Iteration 0, loss = 0.0028
Iteration 20, loss = 0.0039
Iteration 40, loss = 0.0029
Iteration 60, loss = 0.0020
Iteration 80, loss = 0.0035
--- Epoch 850 / 1506 - 2344 epochs total
Iteration 0, loss = 0.0032
Iteration 20, loss = 0.0031
Iteration 40, loss = 0.0030
Iteration 60, loss = 0.0036
Iteration 80, loss = 0.0065
--- Epoch 851 / 1506 - 2345 epochs total
Iteration 0, loss = 0.0044
Iteration 20, loss = 0.0062
Iteration 40, loss = 0.0035
Iteration 60, loss = 0.0057
Iteration 80, loss = 0.0035
--- Epoch 852 / 1506 - 2346 epochs total
Iteration 0, loss = 0.0049
Iteration 20, loss = 0.0066
Iteration 40, loss = 0.0050
Iteration 60, loss = 0.0038
Iteration 80, loss = 0.0046
--- Epoch 853 / 1506 - 2347 epochs total
Iteration 0, loss = 0.0020
Iteration 20, loss = 0.0024
Iteration 40, loss = 0.0019
Iteration 60, loss = 0.0034
Iteration 80, loss = 0.0180
--- Epoch 854 / 1506 - 2348 epochs total
Iteration 0, loss = 0.0031
Iteration 20, loss = 0.0045
Iteration 40, loss = 0.0021
Iteration 60, loss = 0.0040
Iteration 80, loss = 0.0030
--- Epoch 855 / 1506 - 2349 epochs total
Iteration 0, loss = 0.0074
Iteration 20, loss = 0.0027
Iteration 40, loss = 0.0045
Iteration 60, loss = 0.0025
Iteration 80, loss = 0.0026
--- Epoch 856 / 1506 - 2350 epochs total
Iteration 0, loss = 0.0120
Iteration 20, loss = 0.0009
Iteration 40, loss = 0.0074
Iteration 60, loss = 0.0047
Iteration 80, loss = 0.0104
--- Epoch 857 / 1506 - 2351 epochs total
Iteration 0, loss = 0.0020
Iteration 20, loss = 0.0024
Iteration 40, loss = 0.0043
Iteration 60, loss = 0.0076
Iteration 80, loss = 0.0053
--- Epoch 858 / 1506 - 2352 epochs total
Iteration 0, loss = 0.0098
Iteration 20, loss = 0.0031
Iteration 40, loss = 0.0032
Iteration 60, loss = 0.0021
Iteration 80, loss = 0.0126
--- Epoch 859 / 1506 - 2353 epochs total
Iteration 0, loss = 0.0034
Iteration 20, loss = 0.0015
Iteration 40, loss = 0.0024
Iteration 60, loss = 0.0031
Iteration 80, loss = 0.0056
--- Epoch 860 / 1506 - 2354 epochs total
Iteration 0, loss = 0.0074
Iteration 20, loss = 0.0020
Iteration 40, loss = 0.0056
Iteration 60, loss = 0.0059
Iteration 80, loss = 0.0057
--- Epoch 861 / 1506 - 2355 epochs total
Iteration 0, loss = 0.0022
Iteration 20, loss = 0.0032
Iteration 40, loss = 0.0019
Iteration 60, loss = 0.0059
Iteration 80, loss = 0.0027
--- Epoch 862 / 1506 - 2356 epochs total
Iteration 0, loss = 0.0071
Iteration 20, loss = 0.0037
Iteration 40, loss = 0.0253
Iteration 60, loss = 0.0019
Iteration 80, loss = 0.0052
--- Epoch 863 / 1506 - 2357 epochs total
Iteration 0, loss = 0.0060
Iteration 20, loss = 0.0059
Iteration 40, loss = 0.0281
Iteration 60, loss = 0.0047
Iteration 80, loss = 0.0073
--- Epoch 864 / 1506 - 2358 epochs total
Iteration 0, loss = 0.0119
Iteration 20, loss = 0.0042
Iteration 40, loss = 0.0023
Iteration 60, loss = 0.0067
Iteration 80, loss = 0.0032
--- Epoch 865 / 1506 - 2359 epochs total
Iteration 0, loss = 0.0026
Iteration 20, loss = 0.0038
Iteration 40, loss = 0.0192
Iteration 60, loss = 0.0040
Iteration 80, loss = 0.0052
--- Epoch 866 / 1506 - 2360 epochs total
Iteration 0, loss = 0.0020
Iteration 20, loss = 0.0029
Iteration 40, loss = 0.0051
Iteration 60, loss = 0.0029
Iteration 80, loss = 0.0048
--- Epoch 867 / 1506 - 2361 epochs total
Iteration 0, loss = 0.0040
Iteration 20, loss = 0.0010
Iteration 40, loss = 0.0021
Iteration 60, loss = 0.0048
Iteration 80, loss = 0.0034
--- Epoch 868 / 1506 - 2362 epochs total
Iteration 0, loss = 0.0046
Iteration 20, loss = 0.0043
Iteration 40, loss = 0.0055
Iteration 60, loss = 0.0033
Iteration 80, loss = 0.0036
--- Epoch 869 / 1506 - 2363 epochs total
Iteration 0, loss = 0.0214
Iteration 20, loss = 0.0039
Iteration 40, loss = 0.0076
Iteration 60, loss = 0.0066
Iteration 80, loss = 0.0079
--- Epoch 870 / 1506 - 2364 epochs total
Iteration 0, loss = 0.0016
Iteration 20, loss = 0.0028
Iteration 40, loss = 0.0068
Iteration 60, loss = 0.0071
Iteration 80, loss = 0.0041
--- Epoch 871 / 1506 - 2365 epochs total
Iteration 0, loss = 0.0050
Iteration 20, loss = 0.0031
Iteration 40, loss = 0.0080
Iteration 60, loss = 0.0079
Iteration 80, loss = 0.0017
--- Epoch 872 / 1506 - 2366 epochs total
Iteration 0, loss = 0.0026
Iteration 20, loss = 0.0029
Iteration 40, loss = 0.0047
Iteration 60, loss = 0.0024
Iteration 80, loss = 0.0054
--- Epoch 873 / 1506 - 2367 epochs total
Iteration 0, loss = 0.0036
Iteration 20, loss = 0.0024
Iteration 40, loss = 0.0052
Iteration 60, loss = 0.0073
Iteration 80, loss = 0.0027
--- Epoch 874 / 1506 - 2368 epochs total
Iteration 0, loss = 0.0034
Iteration 20, loss = 0.0078
Iteration 40, loss = 0.0099
Iteration 60, loss = 0.0032
Iteration 80, loss = 0.0033
--- Epoch 875 / 1506 - 2369 epochs total
Iteration 0, loss = 0.0027
Iteration 20, loss = 0.0032
Iteration 40, loss = 0.0067
Iteration 60, loss = 0.0141
Iteration 80, loss = 0.0049
--- Epoch 876 / 1506 - 2370 epochs total
Iteration 0, loss = 0.0047
Iteration 20, loss = 0.0027
Iteration 40, loss = 0.0027
Iteration 60, loss = 0.0054
Iteration 80, loss = 0.0037
--- Epoch 877 / 1506 - 2371 epochs total
Iteration 0, loss = 0.0037
Iteration 20, loss = 0.0025
Iteration 40, loss = 0.0022
Iteration 60, loss = 0.0036
Iteration 80, loss = 0.0027
--- Epoch 878 / 1506 - 2372 epochs total
Iteration 0, loss = 0.0056
Iteration 20, loss = 0.0041
Iteration 40, loss = 0.0026
Iteration 60, loss = 0.0046
Iteration 80, loss = 0.0047
--- Epoch 879 / 1506 - 2373 epochs total
Iteration 0, loss = 0.0026
Iteration 20, loss = 0.0123
Iteration 40, loss = 0.0013
Iteration 60, loss = 0.0061
Iteration 80, loss = 0.0038
--- Epoch 880 / 1506 - 2374 epochs total
Iteration 0, loss = 0.0068
Iteration 20, loss = 0.0065
Iteration 40, loss = 0.0038
Iteration 60, loss = 0.0066
Iteration 80, loss = 0.0024
--- Epoch 881 / 1506 - 2375 epochs total
Iteration 0, loss = 0.0039
Iteration 20, loss = 0.0021
Iteration 40, loss = 0.0038
Iteration 60, loss = 0.0013
Iteration 80, loss = 0.0098
--- Epoch 882 / 1506 - 2376 epochs total
Iteration 0, loss = 0.0051
Iteration 20, loss = 0.0033
Iteration 40, loss = 0.0064
Iteration 60, loss = 0.0034
Iteration 80, loss = 0.0027
--- Epoch 883 / 1506 - 2377 epochs total
Iteration 0, loss = 0.0035
Iteration 20, loss = 0.0043
Iteration 40, loss = 0.0030
Iteration 60, loss = 0.0022
Iteration 80, loss = 0.0053
--- Epoch 884 / 1506 - 2378 epochs total
Iteration 0, loss = 0.0028
Iteration 20, loss = 0.0092
Iteration 40, loss = 0.0137
Iteration 60, loss = 0.0019
Iteration 80, loss = 0.0026
--- Epoch 885 / 1506 - 2379 epochs total
Iteration 0, loss = 0.0112
Iteration 20, loss = 0.0014
Iteration 40, loss = 0.0039
Iteration 60, loss = 0.0013
Iteration 80, loss = 0.0031
--- Epoch 886 / 1506 - 2380 epochs total
Iteration 0, loss = 0.0029
Iteration 20, loss = 0.0023
Iteration 40, loss = 0.0012
Iteration 60, loss = 0.0052
Iteration 80, loss = 0.0029
--- Epoch 887 / 1506 - 2381 epochs total
Iteration 0, loss = 0.0015
Iteration 20, loss = 0.0024
Iteration 40, loss = 0.0079
Iteration 60, loss = 0.0060
Iteration 80, loss = 0.0138
--- Epoch 888 / 1506 - 2382 epochs total
Iteration 0, loss = 0.0055
Iteration 20, loss = 0.0018
Iteration 40, loss = 0.0040
Iteration 60, loss = 0.0045
Iteration 80, loss = 0.0031
--- Epoch 889 / 1506 - 2383 epochs total
Iteration 0, loss = 0.0019
Iteration 20, loss = 0.0019
Iteration 40, loss = 0.0018
Iteration 60, loss = 0.0022
Iteration 80, loss = 0.0025
--- Epoch 890 / 1506 - 2384 epochs total
Iteration 0, loss = 0.0036
Iteration 20, loss = 0.0025
Iteration 40, loss = 0.0084
Iteration 60, loss = 0.0018
Iteration 80, loss = 0.0062
--- Epoch 891 / 1506 - 2385 epochs total
Iteration 0, loss = 0.0019
Iteration 20, loss = 0.0050
Iteration 40, loss = 0.0064
Iteration 60, loss = 0.0026
Iteration 80, loss = 0.0109
--- Epoch 892 / 1506 - 2386 epochs total
Iteration 0, loss = 0.0034
Iteration 20, loss = 0.0071
Iteration 40, loss = 0.0026
Iteration 60, loss = 0.0024
Iteration 80, loss = 0.0023
--- Epoch 893 / 1506 - 2387 epochs total
Iteration 0, loss = 0.0066
Iteration 20, loss = 0.0023
Iteration 40, loss = 0.0049
Iteration 60, loss = 0.0069
Iteration 80, loss = 0.0044
--- Epoch 894 / 1506 - 2388 epochs total
Iteration 0, loss = 0.0038
Iteration 20, loss = 0.0040
Iteration 40, loss = 0.0020
Iteration 60, loss = 0.0055
Iteration 80, loss = 0.0033
--- Epoch 895 / 1506 - 2389 epochs total
Iteration 0, loss = 0.0049
Iteration 20, loss = 0.0049
Iteration 40, loss = 0.0143
Iteration 60, loss = 0.0023
Iteration 80, loss = 0.0059
--- Epoch 896 / 1506 - 2390 epochs total
Iteration 0, loss = 0.0052
Iteration 20, loss = 0.0044
Iteration 40, loss = 0.0036
Iteration 60, loss = 0.0040
Iteration 80, loss = 0.0041
--- Epoch 897 / 1506 - 2391 epochs total
Iteration 0, loss = 0.0014
Iteration 20, loss = 0.0038
Iteration 40, loss = 0.0072
Iteration 60, loss = 0.0050
Iteration 80, loss = 0.0046
--- Epoch 898 / 1506 - 2392 epochs total
Iteration 0, loss = 0.0108
Iteration 20, loss = 0.0031
Iteration 40, loss = 0.0059
Iteration 60, loss = 0.0018
Iteration 80, loss = 0.0046
--- Epoch 899 / 1506 - 2393 epochs total
Iteration 0, loss = 0.0049
Iteration 20, loss = 0.0107
Iteration 40, loss = 0.0044
Iteration 60, loss = 0.0017
Iteration 80, loss = 0.0043
--- Epoch 900 / 1506 - 2394 epochs total
Iteration 0, loss = 0.0049
Iteration 20, loss = 0.0184
Iteration 40, loss = 0.0116
Iteration 60, loss = 0.0095
Iteration 80, loss = 0.0025
--- Epoch 901 / 1506 - 2395 epochs total
Iteration 0, loss = 0.0055
Iteration 20, loss = 0.0042
Iteration 40, loss = 0.0046
Iteration 60, loss = 0.0038
Iteration 80, loss = 0.0029
--- Epoch 902 / 1506 - 2396 epochs total
Iteration 0, loss = 0.0033
Iteration 20, loss = 0.0027
Iteration 40, loss = 0.0069
Iteration 60, loss = 0.0058
Iteration 80, loss = 0.0024
--- Epoch 903 / 1506 - 2397 epochs total
Iteration 0, loss = 0.0063
Iteration 20, loss = 0.0054
Iteration 40, loss = 0.0018
Iteration 60, loss = 0.0044
Iteration 80, loss = 0.0025
--- Epoch 904 / 1506 - 2398 epochs total
Iteration 0, loss = 0.0020
Iteration 20, loss = 0.0038
Iteration 40, loss = 0.0047
Iteration 60, loss = 0.0020
Iteration 80, loss = 0.0034
--- Epoch 905 / 1506 - 2399 epochs total
Iteration 0, loss = 0.0062
Iteration 20, loss = 0.0017
Iteration 40, loss = 0.0019
Iteration 60, loss = 0.0084
Iteration 80, loss = 0.0027
--- Epoch 906 / 1506 - 2400 epochs total
Iteration 0, loss = 0.0061
Iteration 20, loss = 0.0036
Iteration 40, loss = 0.0165
Iteration 60, loss = 0.0042
Iteration 80, loss = 0.0018
--- Epoch 907 / 1506 - 2401 epochs total
Iteration 0, loss = 0.0096
Iteration 20, loss = 0.0025
Iteration 40, loss = 0.0048
Iteration 60, loss = 0.0027
Iteration 80, loss = 0.0031
--- Epoch 908 / 1506 - 2402 epochs total
Iteration 0, loss = 0.0054
Iteration 20, loss = 0.0049
Iteration 40, loss = 0.0038
Iteration 60, loss = 0.0067
Iteration 80, loss = 0.0026
--- Epoch 909 / 1506 - 2403 epochs total
Iteration 0, loss = 0.0047
Iteration 20, loss = 0.0027
Iteration 40, loss = 0.0045
Iteration 60, loss = 0.0042
Iteration 80, loss = 0.0055
--- Epoch 910 / 1506 - 2404 epochs total
Iteration 0, loss = 0.0048
Iteration 20, loss = 0.0067
Iteration 40, loss = 0.0019
Iteration 60, loss = 0.0047
Iteration 80, loss = 0.0043
--- Epoch 911 / 1506 - 2405 epochs total
Iteration 0, loss = 0.0024
Iteration 20, loss = 0.0045
Iteration 40, loss = 0.0045
Iteration 60, loss = 0.0038
Iteration 80, loss = 0.0030
--- Epoch 912 / 1506 - 2406 epochs total
Iteration 0, loss = 0.0049
Iteration 20, loss = 0.0095
Iteration 40, loss = 0.0059
Iteration 60, loss = 0.0030
Iteration 80, loss = 0.0060
--- Epoch 913 / 1506 - 2407 epochs total
Iteration 0, loss = 0.0020
Iteration 20, loss = 0.0066
Iteration 40, loss = 0.0048
Iteration 60, loss = 0.0032
Iteration 80, loss = 0.0031
--- Epoch 914 / 1506 - 2408 epochs total
Iteration 0, loss = 0.0022
Iteration 20, loss = 0.0075
Iteration 40, loss = 0.0026
Iteration 60, loss = 0.0020
Iteration 80, loss = 0.0025
--- Epoch 915 / 1506 - 2409 epochs total
Iteration 0, loss = 0.0018
Iteration 20, loss = 0.0029
Iteration 40, loss = 0.0049
Iteration 60, loss = 0.0018
Iteration 80, loss = 0.0052
--- Epoch 916 / 1506 - 2410 epochs total
Iteration 0, loss = 0.0053
Iteration 20, loss = 0.0088
Iteration 40, loss = 0.0029
Iteration 60, loss = 0.0041
Iteration 80, loss = 0.0018
--- Epoch 917 / 1506 - 2411 epochs total
Iteration 0, loss = 0.0063
Iteration 20, loss = 0.0027
Iteration 40, loss = 0.0027
Iteration 60, loss = 0.0029
Iteration 80, loss = 0.0019
--- Epoch 918 / 1506 - 2412 epochs total
Iteration 0, loss = 0.0016
Iteration 20, loss = 0.0051
Iteration 40, loss = 0.0117
Iteration 60, loss = 0.0071
Iteration 80, loss = 0.0040
--- Epoch 919 / 1506 - 2413 epochs total
Iteration 0, loss = 0.0020
Iteration 20, loss = 0.0018
Iteration 40, loss = 0.0057
Iteration 60, loss = 0.0036
Iteration 80, loss = 0.0185
--- Epoch 920 / 1506 - 2414 epochs total
Iteration 0, loss = 0.0029
Iteration 20, loss = 0.0030
Iteration 40, loss = 0.0034
Iteration 60, loss = 0.0052
Iteration 80, loss = 0.0060
--- Epoch 921 / 1506 - 2415 epochs total
Iteration 0, loss = 0.0047
Iteration 20, loss = 0.0072
Iteration 40, loss = 0.0044
Iteration 60, loss = 0.0035
Iteration 80, loss = 0.0029
--- Epoch 922 / 1506 - 2416 epochs total
Iteration 0, loss = 0.0024
Iteration 20, loss = 0.0061
Iteration 40, loss = 0.0058
Iteration 60, loss = 0.0066
Iteration 80, loss = 0.0025
--- Epoch 923 / 1506 - 2417 epochs total
Iteration 0, loss = 0.0144
Iteration 20, loss = 0.0023
Iteration 40, loss = 0.0021
Iteration 60, loss = 0.0047
Iteration 80, loss = 0.0031
--- Epoch 924 / 1506 - 2418 epochs total
Iteration 0, loss = 0.0027
Iteration 20, loss = 0.0043
Iteration 40, loss = 0.0057
Iteration 60, loss = 0.0082
Iteration 80, loss = 0.0052
--- Epoch 925 / 1506 - 2419 epochs total
Iteration 0, loss = 0.0039
Iteration 20, loss = 0.0034
Iteration 40, loss = 0.0021
Iteration 60, loss = 0.0091
Iteration 80, loss = 0.0030
--- Epoch 926 / 1506 - 2420 epochs total
Iteration 0, loss = 0.0031
Iteration 20, loss = 0.0083
Iteration 40, loss = 0.0031
Iteration 60, loss = 0.0035
Iteration 80, loss = 0.0035
--- Epoch 927 / 1506 - 2421 epochs total
Iteration 0, loss = 0.0041
Iteration 20, loss = 0.0049
Iteration 40, loss = 0.0032
Iteration 60, loss = 0.0046
Iteration 80, loss = 0.0038
--- Epoch 928 / 1506 - 2422 epochs total
Iteration 0, loss = 0.0041
Iteration 20, loss = 0.0025
Iteration 40, loss = 0.0059
Iteration 60, loss = 0.0010
Iteration 80, loss = 0.0032
--- Epoch 929 / 1506 - 2423 epochs total
Iteration 0, loss = 0.0062
Iteration 20, loss = 0.0074
Iteration 40, loss = 0.0073
Iteration 60, loss = 0.0046
Iteration 80, loss = 0.0025
--- Epoch 930 / 1506 - 2424 epochs total
Iteration 0, loss = 0.0041
Iteration 20, loss = 0.0051
Iteration 40, loss = 0.0032
Iteration 60, loss = 0.0019
Iteration 80, loss = 0.0077
--- Epoch 931 / 1506 - 2425 epochs total
Iteration 0, loss = 0.0018
Iteration 20, loss = 0.0040
Iteration 40, loss = 0.0054
Iteration 60, loss = 0.0019
Iteration 80, loss = 0.0043
--- Epoch 932 / 1506 - 2426 epochs total
Iteration 0, loss = 0.0020
Iteration 20, loss = 0.0018
Iteration 40, loss = 0.0022
Iteration 60, loss = 0.0023
Iteration 80, loss = 0.0047
--- Epoch 933 / 1506 - 2427 epochs total
Iteration 0, loss = 0.0032
Iteration 20, loss = 0.0015
Iteration 40, loss = 0.0049
Iteration 60, loss = 0.0028
Iteration 80, loss = 0.0017
--- Epoch 934 / 1506 - 2428 epochs total
Iteration 0, loss = 0.0031
Iteration 20, loss = 0.0057
Iteration 40, loss = 0.0031
Iteration 60, loss = 0.0038
Iteration 80, loss = 0.0027
--- Epoch 935 / 1506 - 2429 epochs total
Iteration 0, loss = 0.0050
Iteration 20, loss = 0.0067
Iteration 40, loss = 0.0034
Iteration 60, loss = 0.0035
Iteration 80, loss = 0.0077
--- Epoch 936 / 1506 - 2430 epochs total
Iteration 0, loss = 0.0064
Iteration 20, loss = 0.0027
Iteration 40, loss = 0.0050
Iteration 60, loss = 0.0044
Iteration 80, loss = 0.0088
--- Epoch 937 / 1506 - 2431 epochs total
Iteration 0, loss = 0.0053
Iteration 20, loss = 0.0066
Iteration 40, loss = 0.0039
Iteration 60, loss = 0.0040
Iteration 80, loss = 0.0053
--- Epoch 938 / 1506 - 2432 epochs total
Iteration 0, loss = 0.0028
Iteration 20, loss = 0.0045
Iteration 40, loss = 0.0035
Iteration 60, loss = 0.0088
Iteration 80, loss = 0.0027
--- Epoch 939 / 1506 - 2433 epochs total
Iteration 0, loss = 0.0030
Iteration 20, loss = 0.0032
Iteration 40, loss = 0.0084
Iteration 60, loss = 0.0029
Iteration 80, loss = 0.0078
--- Epoch 940 / 1506 - 2434 epochs total
Iteration 0, loss = 0.0040
Iteration 20, loss = 0.0028
Iteration 40, loss = 0.0064
Iteration 60, loss = 0.0065
Iteration 80, loss = 0.0055
--- Epoch 941 / 1506 - 2435 epochs total
Iteration 0, loss = 0.0075
Iteration 20, loss = 0.0020
Iteration 40, loss = 0.0130
Iteration 60, loss = 0.0027
Iteration 80, loss = 0.0040
--- Epoch 942 / 1506 - 2436 epochs total
Iteration 0, loss = 0.0041
Iteration 20, loss = 0.0019
Iteration 40, loss = 0.0028
Iteration 60, loss = 0.0064
Iteration 80, loss = 0.0036
--- Epoch 943 / 1506 - 2437 epochs total
Iteration 0, loss = 0.0028
Iteration 20, loss = 0.0040
Iteration 40, loss = 0.0021
Iteration 60, loss = 0.0055
Iteration 80, loss = 0.0032
--- Epoch 944 / 1506 - 2438 epochs total
Iteration 0, loss = 0.0067
Iteration 20, loss = 0.0041
Iteration 40, loss = 0.0070
Iteration 60, loss = 0.0030
Iteration 80, loss = 0.0122
--- Epoch 945 / 1506 - 2439 epochs total
Iteration 0, loss = 0.0030
Iteration 20, loss = 0.0034
Iteration 40, loss = 0.0031
Iteration 60, loss = 0.0040
Iteration 80, loss = 0.0024
--- Epoch 946 / 1506 - 2440 epochs total
Iteration 0, loss = 0.0059
Iteration 20, loss = 0.0020
Iteration 40, loss = 0.0040
Iteration 60, loss = 0.0055
Iteration 80, loss = 0.0022
--- Epoch 947 / 1506 - 2441 epochs total
Iteration 0, loss = 0.0040
Iteration 20, loss = 0.0024
Iteration 40, loss = 0.0027
Iteration 60, loss = 0.0026
Iteration 80, loss = 0.0031
--- Epoch 948 / 1506 - 2442 epochs total
Iteration 0, loss = 0.0039
Iteration 20, loss = 0.0039
Iteration 40, loss = 0.0023
Iteration 60, loss = 0.0043
Iteration 80, loss = 0.0075
--- Epoch 949 / 1506 - 2443 epochs total
Iteration 0, loss = 0.0022
Iteration 20, loss = 0.0050
Iteration 40, loss = 0.0039
Iteration 60, loss = 0.0066
Iteration 80, loss = 0.0113
--- Epoch 950 / 1506 - 2444 epochs total
Iteration 0, loss = 0.0033
Iteration 20, loss = 0.0042
Iteration 40, loss = 0.0033
Iteration 60, loss = 0.0068
Iteration 80, loss = 0.0032
--- Epoch 951 / 1506 - 2445 epochs total
Iteration 0, loss = 0.0052
Iteration 20, loss = 0.0028
Iteration 40, loss = 0.0089
Iteration 60, loss = 0.0021
Iteration 80, loss = 0.0024
--- Epoch 952 / 1506 - 2446 epochs total
Iteration 0, loss = 0.0041
Iteration 20, loss = 0.0048
Iteration 40, loss = 0.0025
Iteration 60, loss = 0.0096
Iteration 80, loss = 0.0057
--- Epoch 953 / 1506 - 2447 epochs total
Iteration 0, loss = 0.0107
Iteration 20, loss = 0.0062
Iteration 40, loss = 0.0030
Iteration 60, loss = 0.0035
Iteration 80, loss = 0.0030
--- Epoch 954 / 1506 - 2448 epochs total
Iteration 0, loss = 0.0029
Iteration 20, loss = 0.0029
Iteration 40, loss = 0.0058
Iteration 60, loss = 0.0042
Iteration 80, loss = 0.0034
--- Epoch 955 / 1506 - 2449 epochs total
Iteration 0, loss = 0.0034
Iteration 20, loss = 0.0023
Iteration 40, loss = 0.0039
Iteration 60, loss = 0.0042
Iteration 80, loss = 0.0069
--- Epoch 956 / 1506 - 2450 epochs total
Iteration 0, loss = 0.0021
Iteration 20, loss = 0.0078
Iteration 40, loss = 0.0022
Iteration 60, loss = 0.0069
Iteration 80, loss = 0.0041
--- Epoch 957 / 1506 - 2451 epochs total
Iteration 0, loss = 0.0021
Iteration 20, loss = 0.0028
Iteration 40, loss = 0.0030
Iteration 60, loss = 0.0050
Iteration 80, loss = 0.0091
--- Epoch 958 / 1506 - 2452 epochs total
Iteration 0, loss = 0.0091
Iteration 20, loss = 0.0042
Iteration 40, loss = 0.0074
Iteration 60, loss = 0.0044
Iteration 80, loss = 0.0035
--- Epoch 959 / 1506 - 2453 epochs total
Iteration 0, loss = 0.0023
Iteration 20, loss = 0.0031
Iteration 40, loss = 0.0022
Iteration 60, loss = 0.0028
Iteration 80, loss = 0.0039
--- Epoch 960 / 1506 - 2454 epochs total
Iteration 0, loss = 0.0034
Iteration 20, loss = 0.0027
Iteration 40, loss = 0.0029
Iteration 60, loss = 0.0044
Iteration 80, loss = 0.0042
--- Epoch 961 / 1506 - 2455 epochs total
Iteration 0, loss = 0.0039
Iteration 20, loss = 0.0097
Iteration 40, loss = 0.0033
Iteration 60, loss = 0.0035
Iteration 80, loss = 0.0032
--- Epoch 962 / 1506 - 2456 epochs total
Iteration 0, loss = 0.0043
Iteration 20, loss = 0.0024
Iteration 40, loss = 0.0019
Iteration 60, loss = 0.0071
Iteration 80, loss = 0.0280
--- Epoch 963 / 1506 - 2457 epochs total
Iteration 0, loss = 0.0036
Iteration 20, loss = 0.0034
Iteration 40, loss = 0.0022
Iteration 60, loss = 0.0041
Iteration 80, loss = 0.0035
--- Epoch 964 / 1506 - 2458 epochs total
Iteration 0, loss = 0.0028
Iteration 20, loss = 0.0027
Iteration 40, loss = 0.0020
Iteration 60, loss = 0.0061
Iteration 80, loss = 0.0031
--- Epoch 965 / 1506 - 2459 epochs total
Iteration 0, loss = 0.0032
Iteration 20, loss = 0.0031
Iteration 40, loss = 0.0027
Iteration 60, loss = 0.0046
Iteration 80, loss = 0.0032
--- Epoch 966 / 1506 - 2460 epochs total
Iteration 0, loss = 0.0043
Iteration 20, loss = 0.0029
Iteration 40, loss = 0.0070
Iteration 60, loss = 0.0042
Iteration 80, loss = 0.0064
--- Epoch 967 / 1506 - 2461 epochs total
Iteration 0, loss = 0.0036
Iteration 20, loss = 0.0048
Iteration 40, loss = 0.0143
Iteration 60, loss = 0.0032
Iteration 80, loss = 0.0041
--- Epoch 968 / 1506 - 2462 epochs total
Iteration 0, loss = 0.0037
Iteration 20, loss = 0.0036
Iteration 40, loss = 0.0070
Iteration 60, loss = 0.0022
Iteration 80, loss = 0.0055
--- Epoch 969 / 1506 - 2463 epochs total
Iteration 0, loss = 0.0059
Iteration 20, loss = 0.0064
Iteration 40, loss = 0.0043
Iteration 60, loss = 0.0038
Iteration 80, loss = 0.0055
--- Epoch 970 / 1506 - 2464 epochs total
Iteration 0, loss = 0.0028
Iteration 20, loss = 0.0026
Iteration 40, loss = 0.0056
Iteration 60, loss = 0.0090
Iteration 80, loss = 0.0045
--- Epoch 971 / 1506 - 2465 epochs total
Iteration 0, loss = 0.0023
Iteration 20, loss = 0.0035
Iteration 40, loss = 0.0041
Iteration 60, loss = 0.0043
Iteration 80, loss = 0.0028
--- Epoch 972 / 1506 - 2466 epochs total
Iteration 0, loss = 0.0023
Iteration 20, loss = 0.0041
Iteration 40, loss = 0.0024
Iteration 60, loss = 0.0044
Iteration 80, loss = 0.0042
--- Epoch 973 / 1506 - 2467 epochs total
Iteration 0, loss = 0.0046
Iteration 20, loss = 0.0039
Iteration 40, loss = 0.0023
Iteration 60, loss = 0.0043
Iteration 80, loss = 0.0034
--- Epoch 974 / 1506 - 2468 epochs total
Iteration 0, loss = 0.0026
Iteration 20, loss = 0.0018
Iteration 40, loss = 0.0021
Iteration 60, loss = 0.0022
Iteration 80, loss = 0.0051
--- Epoch 975 / 1506 - 2469 epochs total
Iteration 0, loss = 0.0078
Iteration 20, loss = 0.0036
Iteration 40, loss = 0.0023
Iteration 60, loss = 0.0047
Iteration 80, loss = 0.0070
--- Epoch 976 / 1506 - 2470 epochs total
Iteration 0, loss = 0.0052
Iteration 20, loss = 0.0035
Iteration 40, loss = 0.0080
Iteration 60, loss = 0.0068
Iteration 80, loss = 0.0041
--- Epoch 977 / 1506 - 2471 epochs total
Iteration 0, loss = 0.0033
Iteration 20, loss = 0.0028
Iteration 40, loss = 0.0122
Iteration 60, loss = 0.0121
Iteration 80, loss = 0.0032
--- Epoch 978 / 1506 - 2472 epochs total
Iteration 0, loss = 0.0015
Iteration 20, loss = 0.0048
Iteration 40, loss = 0.0026
Iteration 60, loss = 0.0051
Iteration 80, loss = 0.0068
--- Epoch 979 / 1506 - 2473 epochs total
Iteration 0, loss = 0.0029
Iteration 20, loss = 0.0026
Iteration 40, loss = 0.0046
Iteration 60, loss = 0.0022
Iteration 80, loss = 0.0047
--- Epoch 980 / 1506 - 2474 epochs total
Iteration 0, loss = 0.0037
Iteration 20, loss = 0.0046
Iteration 40, loss = 0.0023
Iteration 60, loss = 0.0009
Iteration 80, loss = 0.0060
--- Epoch 981 / 1506 - 2475 epochs total
Iteration 0, loss = 0.0031
Iteration 20, loss = 0.0039
Iteration 40, loss = 0.0039
Iteration 60, loss = 0.0089
Iteration 80, loss = 0.0055
--- Epoch 982 / 1506 - 2476 epochs total
Iteration 0, loss = 0.0032
Iteration 20, loss = 0.0015
Iteration 40, loss = 0.0027
Iteration 60, loss = 0.0023
Iteration 80, loss = 0.0045
--- Epoch 983 / 1506 - 2477 epochs total
Iteration 0, loss = 0.0066
Iteration 20, loss = 0.0036
Iteration 40, loss = 0.0028
Iteration 60, loss = 0.0032
Iteration 80, loss = 0.0037
--- Epoch 984 / 1506 - 2478 epochs total
Iteration 0, loss = 0.0029
Iteration 20, loss = 0.0031
Iteration 40, loss = 0.0043
Iteration 60, loss = 0.0051
Iteration 80, loss = 0.0024
--- Epoch 985 / 1506 - 2479 epochs total
Iteration 0, loss = 0.0149
Iteration 20, loss = 0.0037
Iteration 40, loss = 0.0065
Iteration 60, loss = 0.0016
Iteration 80, loss = 0.0012
--- Epoch 986 / 1506 - 2480 epochs total
Iteration 0, loss = 0.0038
Iteration 20, loss = 0.0074
Iteration 40, loss = 0.0069
Iteration 60, loss = 0.0040
Iteration 80, loss = 0.0057
--- Epoch 987 / 1506 - 2481 epochs total
Iteration 0, loss = 0.0032
Iteration 20, loss = 0.0033
Iteration 40, loss = 0.0117
Iteration 60, loss = 0.0074
Iteration 80, loss = 0.0027
--- Epoch 988 / 1506 - 2482 epochs total
Iteration 0, loss = 0.0043
Iteration 20, loss = 0.0022
Iteration 40, loss = 0.0027
Iteration 60, loss = 0.0069
Iteration 80, loss = 0.0024
--- Epoch 989 / 1506 - 2483 epochs total
Iteration 0, loss = 0.0020
Iteration 20, loss = 0.0082
Iteration 40, loss = 0.0103
Iteration 60, loss = 0.0041
Iteration 80, loss = 0.0063
--- Epoch 990 / 1506 - 2484 epochs total
Iteration 0, loss = 0.0028
Iteration 20, loss = 0.0039
Iteration 40, loss = 0.0042
Iteration 60, loss = 0.0049
Iteration 80, loss = 0.0040
--- Epoch 991 / 1506 - 2485 epochs total
Iteration 0, loss = 0.0041
Iteration 20, loss = 0.0086
Iteration 40, loss = 0.0096
Iteration 60, loss = 0.0062
Iteration 80, loss = 0.0036
--- Epoch 992 / 1506 - 2486 epochs total
Iteration 0, loss = 0.0070
Iteration 20, loss = 0.0027
Iteration 40, loss = 0.0010
Iteration 60, loss = 0.0023
Iteration 80, loss = 0.0043
--- Epoch 993 / 1506 - 2487 epochs total
Iteration 0, loss = 0.0033
Iteration 20, loss = 0.0060
Iteration 40, loss = 0.0037
Iteration 60, loss = 0.0083
Iteration 80, loss = 0.0063
--- Epoch 994 / 1506 - 2488 epochs total
Iteration 0, loss = 0.0029
Iteration 20, loss = 0.0022
Iteration 40, loss = 0.0016
Iteration 60, loss = 0.0065
Iteration 80, loss = 0.0074
--- Epoch 995 / 1506 - 2489 epochs total
Iteration 0, loss = 0.0093
Iteration 20, loss = 0.0045
Iteration 40, loss = 0.0016
Iteration 60, loss = 0.0193
Iteration 80, loss = 0.0030
--- Epoch 996 / 1506 - 2490 epochs total
Iteration 0, loss = 0.0027
Iteration 20, loss = 0.0055
Iteration 40, loss = 0.0041
Iteration 60, loss = 0.0024
Iteration 80, loss = 0.0037
--- Epoch 997 / 1506 - 2491 epochs total
Iteration 0, loss = 0.0041
Iteration 20, loss = 0.0027
Iteration 40, loss = 0.0022
Iteration 60, loss = 0.0038
Iteration 80, loss = 0.0026
--- Epoch 998 / 1506 - 2492 epochs total
Iteration 0, loss = 0.0024
Iteration 20, loss = 0.0029
Iteration 40, loss = 0.0035
Iteration 60, loss = 0.0030
Iteration 80, loss = 0.0111
--- Epoch 999 / 1506 - 2493 epochs total
Iteration 0, loss = 0.0052
Iteration 20, loss = 0.0072
Iteration 40, loss = 0.0036
Iteration 60, loss = 0.0051
Iteration 80, loss = 0.0027
--- Epoch 1000 / 1506 - 2494 epochs total
Iteration 0, loss = 0.0036
Iteration 20, loss = 0.0040
Iteration 40, loss = 0.0036
Iteration 60, loss = 0.0040
Iteration 80, loss = 0.0020
--- Epoch 1001 / 1506 - 2495 epochs total
Iteration 0, loss = 0.0045
Iteration 20, loss = 0.0027
Iteration 40, loss = 0.0017
Iteration 60, loss = 0.0083
Iteration 80, loss = 0.0071
--- Epoch 1002 / 1506 - 2496 epochs total
Iteration 0, loss = 0.0031
Iteration 20, loss = 0.0032
Iteration 40, loss = 0.0022
Iteration 60, loss = 0.0025
Iteration 80, loss = 0.0048
--- Epoch 1003 / 1506 - 2497 epochs total
Iteration 0, loss = 0.0079
Iteration 20, loss = 0.0041
Iteration 40, loss = 0.0076
Iteration 60, loss = 0.0021
Iteration 80, loss = 0.0040
--- Epoch 1004 / 1506 - 2498 epochs total
Iteration 0, loss = 0.0016
Iteration 20, loss = 0.0018
Iteration 40, loss = 0.0063
Iteration 60, loss = 0.0040
Iteration 80, loss = 0.0016
--- Epoch 1005 / 1506 - 2499 epochs total
Iteration 0, loss = 0.0020
Iteration 20, loss = 0.0040
Iteration 40, loss = 0.0037
Iteration 60, loss = 0.0040
Iteration 80, loss = 0.0018
--- Epoch 1006 / 1506 - 2500 epochs total
Iteration 0, loss = 0.0027
Iteration 20, loss = 0.0019
Iteration 40, loss = 0.0028
Iteration 60, loss = 0.0044
Iteration 80, loss = 0.0036
--- Epoch 1007 / 1506 - 2501 epochs total
Iteration 0, loss = 0.0029
Iteration 20, loss = 0.0011
Iteration 40, loss = 0.0042
Iteration 60, loss = 0.0066
Iteration 80, loss = 0.0036
--- Epoch 1008 / 1506 - 2502 epochs total
Iteration 0, loss = 0.0061
Iteration 20, loss = 0.0030
Iteration 40, loss = 0.0022
Iteration 60, loss = 0.0043
Iteration 80, loss = 0.0047
--- Epoch 1009 / 1506 - 2503 epochs total
Iteration 0, loss = 0.0013
Iteration 20, loss = 0.0021
Iteration 40, loss = 0.0087
Iteration 60, loss = 0.0110
Iteration 80, loss = 0.0035
--- Epoch 1010 / 1506 - 2504 epochs total
Iteration 0, loss = 0.0035
Iteration 20, loss = 0.0044
Iteration 40, loss = 0.0027
Iteration 60, loss = 0.0024
Iteration 80, loss = 0.0069
--- Epoch 1011 / 1506 - 2505 epochs total
Iteration 0, loss = 0.0032
Iteration 20, loss = 0.0133
Iteration 40, loss = 0.0068
Iteration 60, loss = 0.0210
Iteration 80, loss = 0.0117
--- Epoch 1012 / 1506 - 2506 epochs total
Iteration 0, loss = 0.0018
Iteration 20, loss = 0.0082
Iteration 40, loss = 0.0029
Iteration 60, loss = 0.0110
Iteration 80, loss = 0.0020
--- Epoch 1013 / 1506 - 2507 epochs total
Iteration 0, loss = 0.0052
Iteration 20, loss = 0.0029
Iteration 40, loss = 0.0030
Iteration 60, loss = 0.0016
Iteration 80, loss = 0.0050
--- Epoch 1014 / 1506 - 2508 epochs total
Iteration 0, loss = 0.0098
Iteration 20, loss = 0.0056
Iteration 40, loss = 0.0013
Iteration 60, loss = 0.0024
Iteration 80, loss = 0.0020
--- Epoch 1015 / 1506 - 2509 epochs total
Iteration 0, loss = 0.0025
Iteration 20, loss = 0.0038
Iteration 40, loss = 0.0031
Iteration 60, loss = 0.0030
Iteration 80, loss = 0.0042
--- Epoch 1016 / 1506 - 2510 epochs total
Iteration 0, loss = 0.0034
Iteration 20, loss = 0.0118
Iteration 40, loss = 0.0019
Iteration 60, loss = 0.0043
Iteration 80, loss = 0.0028
--- Epoch 1017 / 1506 - 2511 epochs total
Iteration 0, loss = 0.0012
Iteration 20, loss = 0.0027
Iteration 40, loss = 0.0063
Iteration 60, loss = 0.0044
Iteration 80, loss = 0.0058
--- Epoch 1018 / 1506 - 2512 epochs total
Iteration 0, loss = 0.0040
Iteration 20, loss = 0.0053
Iteration 40, loss = 0.0043
Iteration 60, loss = 0.0035
Iteration 80, loss = 0.0036
--- Epoch 1019 / 1506 - 2513 epochs total
Iteration 0, loss = 0.0030
Iteration 20, loss = 0.0037
Iteration 40, loss = 0.0115
Iteration 60, loss = 0.0023
Iteration 80, loss = 0.0048
--- Epoch 1020 / 1506 - 2514 epochs total
Iteration 0, loss = 0.0040
Iteration 20, loss = 0.0063
Iteration 40, loss = 0.0095
Iteration 60, loss = 0.0157
Iteration 80, loss = 0.0089
--- Epoch 1021 / 1506 - 2515 epochs total
Iteration 0, loss = 0.0062
Iteration 20, loss = 0.0034
Iteration 40, loss = 0.0060
Iteration 60, loss = 0.0047
Iteration 80, loss = 0.0023
--- Epoch 1022 / 1506 - 2516 epochs total
Iteration 0, loss = 0.0040
Iteration 20, loss = 0.0030
Iteration 40, loss = 0.0027
Iteration 60, loss = 0.0018
Iteration 80, loss = 0.0044
--- Epoch 1023 / 1506 - 2517 epochs total
Iteration 0, loss = 0.0033
Iteration 20, loss = 0.0119
Iteration 40, loss = 0.0021
Iteration 60, loss = 0.0133
Iteration 80, loss = 0.0038
--- Epoch 1024 / 1506 - 2518 epochs total
Iteration 0, loss = 0.0214
Iteration 20, loss = 0.0124
Iteration 40, loss = 0.0037
Iteration 60, loss = 0.0083
Iteration 80, loss = 0.0062
--- Epoch 1025 / 1506 - 2519 epochs total
Iteration 0, loss = 0.0040
Iteration 20, loss = 0.0030
Iteration 40, loss = 0.0061
Iteration 60, loss = 0.0037
Iteration 80, loss = 0.0086
--- Epoch 1026 / 1506 - 2520 epochs total
Iteration 0, loss = 0.0213
Iteration 20, loss = 0.0014
Iteration 40, loss = 0.0027
Iteration 60, loss = 0.0016
Iteration 80, loss = 0.0056
--- Epoch 1027 / 1506 - 2521 epochs total
Iteration 0, loss = 0.0038
Iteration 20, loss = 0.0052
Iteration 40, loss = 0.0034
Iteration 60, loss = 0.0139
Iteration 80, loss = 0.0099
--- Epoch 1028 / 1506 - 2522 epochs total
Iteration 0, loss = 0.0029
Iteration 20, loss = 0.0029
Iteration 40, loss = 0.0030
Iteration 60, loss = 0.0025
Iteration 80, loss = 0.0023
--- Epoch 1029 / 1506 - 2523 epochs total
Iteration 0, loss = 0.0038
Iteration 20, loss = 0.0025
Iteration 40, loss = 0.0064
Iteration 60, loss = 0.0024
Iteration 80, loss = 0.0031
--- Epoch 1030 / 1506 - 2524 epochs total
Iteration 0, loss = 0.0018
Iteration 20, loss = 0.0037
Iteration 40, loss = 0.0045
Iteration 60, loss = 0.0049
Iteration 80, loss = 0.0024
--- Epoch 1031 / 1506 - 2525 epochs total
Iteration 0, loss = 0.0037
Iteration 20, loss = 0.0020
Iteration 40, loss = 0.0075
Iteration 60, loss = 0.0043
Iteration 80, loss = 0.0025
--- Epoch 1032 / 1506 - 2526 epochs total
Iteration 0, loss = 0.0029
Iteration 20, loss = 0.0042
Iteration 40, loss = 0.0046
Iteration 60, loss = 0.0026
Iteration 80, loss = 0.0020
--- Epoch 1033 / 1506 - 2527 epochs total
Iteration 0, loss = 0.0022
Iteration 20, loss = 0.0037
Iteration 40, loss = 0.0027
Iteration 60, loss = 0.0060
Iteration 80, loss = 0.0032
--- Epoch 1034 / 1506 - 2528 epochs total
Iteration 0, loss = 0.0156
Iteration 20, loss = 0.0014
Iteration 40, loss = 0.0030
Iteration 60, loss = 0.0060
Iteration 80, loss = 0.0064
--- Epoch 1035 / 1506 - 2529 epochs total
Iteration 0, loss = 0.0129
Iteration 20, loss = 0.0033
Iteration 40, loss = 0.0054
Iteration 60, loss = 0.0032
Iteration 80, loss = 0.0089
--- Epoch 1036 / 1506 - 2530 epochs total
Iteration 0, loss = 0.0037
Iteration 20, loss = 0.0032
Iteration 40, loss = 0.0037
Iteration 60, loss = 0.0080
Iteration 80, loss = 0.0056
--- Epoch 1037 / 1506 - 2531 epochs total
Iteration 0, loss = 0.0037
Iteration 20, loss = 0.0052
Iteration 40, loss = 0.0037
Iteration 60, loss = 0.0034
Iteration 80, loss = 0.0054
--- Epoch 1038 / 1506 - 2532 epochs total
Iteration 0, loss = 0.0070
Iteration 20, loss = 0.0043
Iteration 40, loss = 0.0068
Iteration 60, loss = 0.0069
Iteration 80, loss = 0.0060
--- Epoch 1039 / 1506 - 2533 epochs total
Iteration 0, loss = 0.0073
Iteration 20, loss = 0.0071
Iteration 40, loss = 0.0030
Iteration 60, loss = 0.0016
Iteration 80, loss = 0.0037
--- Epoch 1040 / 1506 - 2534 epochs total
Iteration 0, loss = 0.0031
Iteration 20, loss = 0.0049
Iteration 40, loss = 0.0056
Iteration 60, loss = 0.0052
Iteration 80, loss = 0.0032
--- Epoch 1041 / 1506 - 2535 epochs total
Iteration 0, loss = 0.0080
Iteration 20, loss = 0.0047
Iteration 40, loss = 0.0043
Iteration 60, loss = 0.0035
Iteration 80, loss = 0.0044
--- Epoch 1042 / 1506 - 2536 epochs total
Iteration 0, loss = 0.0052
Iteration 20, loss = 0.0079
Iteration 40, loss = 0.0050
Iteration 60, loss = 0.0033
Iteration 80, loss = 0.0040
--- Epoch 1043 / 1506 - 2537 epochs total
Iteration 0, loss = 0.0019
Iteration 20, loss = 0.0043
Iteration 40, loss = 0.0044
Iteration 60, loss = 0.0060
Iteration 80, loss = 0.0042
--- Epoch 1044 / 1506 - 2538 epochs total
Iteration 0, loss = 0.0048
Iteration 20, loss = 0.0041
Iteration 40, loss = 0.0034
Iteration 60, loss = 0.0052
Iteration 80, loss = 0.0022
--- Epoch 1045 / 1506 - 2539 epochs total
Iteration 0, loss = 0.0030
Iteration 20, loss = 0.0026
Iteration 40, loss = 0.0035
Iteration 60, loss = 0.0028
Iteration 80, loss = 0.0051
--- Epoch 1046 / 1506 - 2540 epochs total
Iteration 0, loss = 0.0043
Iteration 20, loss = 0.0037
Iteration 40, loss = 0.0065
Iteration 60, loss = 0.0021
Iteration 80, loss = 0.0020
--- Epoch 1047 / 1506 - 2541 epochs total
Iteration 0, loss = 0.0028
Iteration 20, loss = 0.0039
Iteration 40, loss = 0.0024
Iteration 60, loss = 0.0044
Iteration 80, loss = 0.0040
--- Epoch 1048 / 1506 - 2542 epochs total
Iteration 0, loss = 0.0053
Iteration 20, loss = 0.0048
Iteration 40, loss = 0.0038
Iteration 60, loss = 0.0032
Iteration 80, loss = 0.0020
--- Epoch 1049 / 1506 - 2543 epochs total
Iteration 0, loss = 0.0131
Iteration 20, loss = 0.0034
Iteration 40, loss = 0.0030
Iteration 60, loss = 0.0033
Iteration 80, loss = 0.0074
--- Epoch 1050 / 1506 - 2544 epochs total
Iteration 0, loss = 0.0024
Iteration 20, loss = 0.0035
Iteration 40, loss = 0.0027
Iteration 60, loss = 0.0047
Iteration 80, loss = 0.0058
--- Epoch 1051 / 1506 - 2545 epochs total
Iteration 0, loss = 0.0046
Iteration 20, loss = 0.0050
Iteration 40, loss = 0.0020
Iteration 60, loss = 0.0035
Iteration 80, loss = 0.0062
--- Epoch 1052 / 1506 - 2546 epochs total
Iteration 0, loss = 0.0028
Iteration 20, loss = 0.0040
Iteration 40, loss = 0.0063
Iteration 60, loss = 0.0039
Iteration 80, loss = 0.0084
--- Epoch 1053 / 1506 - 2547 epochs total
Iteration 0, loss = 0.0111
Iteration 20, loss = 0.0026
Iteration 40, loss = 0.0133
Iteration 60, loss = 0.0028
Iteration 80, loss = 0.0061
--- Epoch 1054 / 1506 - 2548 epochs total
Iteration 0, loss = 0.0019
Iteration 20, loss = 0.0058
Iteration 40, loss = 0.0016
Iteration 60, loss = 0.0030
Iteration 80, loss = 0.0056
--- Epoch 1055 / 1506 - 2549 epochs total
Iteration 0, loss = 0.0129
Iteration 20, loss = 0.0138
Iteration 40, loss = 0.0044
Iteration 60, loss = 0.0093
Iteration 80, loss = 0.0060
--- Epoch 1056 / 1506 - 2550 epochs total
Iteration 0, loss = 0.0150
Iteration 20, loss = 0.0050
Iteration 40, loss = 0.0030
Iteration 60, loss = 0.0061
Iteration 80, loss = 0.0040
--- Epoch 1057 / 1506 - 2551 epochs total
Iteration 0, loss = 0.0027
Iteration 20, loss = 0.0041
Iteration 40, loss = 0.0039
Iteration 60, loss = 0.0050
Iteration 80, loss = 0.0033
--- Epoch 1058 / 1506 - 2552 epochs total
Iteration 0, loss = 0.0027
Iteration 20, loss = 0.0011
Iteration 40, loss = 0.0078
Iteration 60, loss = 0.0028
Iteration 80, loss = 0.0019
--- Epoch 1059 / 1506 - 2553 epochs total
Iteration 0, loss = 0.0025
Iteration 20, loss = 0.0056
Iteration 40, loss = 0.0061
Iteration 60, loss = 0.0022
Iteration 80, loss = 0.0070
--- Epoch 1060 / 1506 - 2554 epochs total
Iteration 0, loss = 0.0055
Iteration 20, loss = 0.0032
Iteration 40, loss = 0.0049
Iteration 60, loss = 0.0172
Iteration 80, loss = 0.0061
--- Epoch 1061 / 1506 - 2555 epochs total
Iteration 0, loss = 0.0065
Iteration 20, loss = 0.0057
Iteration 40, loss = 0.0031
Iteration 60, loss = 0.0038
Iteration 80, loss = 0.0018
--- Epoch 1062 / 1506 - 2556 epochs total
Iteration 0, loss = 0.0049
Iteration 20, loss = 0.0018
Iteration 40, loss = 0.0057
Iteration 60, loss = 0.0020
Iteration 80, loss = 0.0044
--- Epoch 1063 / 1506 - 2557 epochs total
Iteration 0, loss = 0.0024
Iteration 20, loss = 0.0029
Iteration 40, loss = 0.0039
Iteration 60, loss = 0.0067
Iteration 80, loss = 0.0138
--- Epoch 1064 / 1506 - 2558 epochs total
Iteration 0, loss = 0.0023
Iteration 20, loss = 0.0096
Iteration 40, loss = 0.0025
Iteration 60, loss = 0.0014
Iteration 80, loss = 0.0029
--- Epoch 1065 / 1506 - 2559 epochs total
Iteration 0, loss = 0.0052
Iteration 20, loss = 0.0030
Iteration 40, loss = 0.0031
Iteration 60, loss = 0.0016
Iteration 80, loss = 0.0046
--- Epoch 1066 / 1506 - 2560 epochs total
Iteration 0, loss = 0.0032
Iteration 20, loss = 0.0011
Iteration 40, loss = 0.0091
Iteration 60, loss = 0.0029
Iteration 80, loss = 0.0030
--- Epoch 1067 / 1506 - 2561 epochs total
Iteration 0, loss = 0.0039
Iteration 20, loss = 0.0056
Iteration 40, loss = 0.0046
Iteration 60, loss = 0.0064
Iteration 80, loss = 0.0029
--- Epoch 1068 / 1506 - 2562 epochs total
Iteration 0, loss = 0.0061
Iteration 20, loss = 0.0081
Iteration 40, loss = 0.0030
Iteration 60, loss = 0.0018
Iteration 80, loss = 0.0059
--- Epoch 1069 / 1506 - 2563 epochs total
Iteration 0, loss = 0.0016
Iteration 20, loss = 0.0044
Iteration 40, loss = 0.0014
Iteration 60, loss = 0.0035
Iteration 80, loss = 0.0029
--- Epoch 1070 / 1506 - 2564 epochs total
Iteration 0, loss = 0.0033
Iteration 20, loss = 0.0081
Iteration 40, loss = 0.0023
Iteration 60, loss = 0.0066
Iteration 80, loss = 0.0060
--- Epoch 1071 / 1506 - 2565 epochs total
Iteration 0, loss = 0.0041
Iteration 20, loss = 0.0040
Iteration 40, loss = 0.0042
Iteration 60, loss = 0.0054
Iteration 80, loss = 0.0045
--- Epoch 1072 / 1506 - 2566 epochs total
Iteration 0, loss = 0.0076
Iteration 20, loss = 0.0019
Iteration 40, loss = 0.0027
Iteration 60, loss = 0.0020
Iteration 80, loss = 0.0034
--- Epoch 1073 / 1506 - 2567 epochs total
Iteration 0, loss = 0.0025
Iteration 20, loss = 0.0042
Iteration 40, loss = 0.0058
Iteration 60, loss = 0.0042
Iteration 80, loss = 0.0037
--- Epoch 1074 / 1506 - 2568 epochs total
Iteration 0, loss = 0.0023
Iteration 20, loss = 0.0047
Iteration 40, loss = 0.0032
Iteration 60, loss = 0.0036
Iteration 80, loss = 0.0032
--- Epoch 1075 / 1506 - 2569 epochs total
Iteration 0, loss = 0.0034
Iteration 20, loss = 0.0044
Iteration 40, loss = 0.0050
Iteration 60, loss = 0.0042
Iteration 80, loss = 0.0035
--- Epoch 1076 / 1506 - 2570 epochs total
Iteration 0, loss = 0.0034
Iteration 20, loss = 0.0023
Iteration 40, loss = 0.0055
Iteration 60, loss = 0.0018
Iteration 80, loss = 0.0068
--- Epoch 1077 / 1506 - 2571 epochs total
Iteration 0, loss = 0.0022
Iteration 20, loss = 0.0054
Iteration 40, loss = 0.0021
Iteration 60, loss = 0.0123
Iteration 80, loss = 0.0056
--- Epoch 1078 / 1506 - 2572 epochs total
Iteration 0, loss = 0.0030
Iteration 20, loss = 0.0088
Iteration 40, loss = 0.0082
Iteration 60, loss = 0.0030
Iteration 80, loss = 0.0031
--- Epoch 1079 / 1506 - 2573 epochs total
Iteration 0, loss = 0.0031
Iteration 20, loss = 0.0032
Iteration 40, loss = 0.0075
Iteration 60, loss = 0.0023
Iteration 80, loss = 0.0014
--- Epoch 1080 / 1506 - 2574 epochs total
Iteration 0, loss = 0.0068
Iteration 20, loss = 0.0122
Iteration 40, loss = 0.0085
Iteration 60, loss = 0.0028
Iteration 80, loss = 0.0056
--- Epoch 1081 / 1506 - 2575 epochs total
Iteration 0, loss = 0.0082
Iteration 20, loss = 0.0035
Iteration 40, loss = 0.0037
Iteration 60, loss = 0.0029
Iteration 80, loss = 0.0222
--- Epoch 1082 / 1506 - 2576 epochs total
Iteration 0, loss = 0.0024
Iteration 20, loss = 0.0038
Iteration 40, loss = 0.0027
Iteration 60, loss = 0.0020
Iteration 80, loss = 0.0062
--- Epoch 1083 / 1506 - 2577 epochs total
Iteration 0, loss = 0.0038
Iteration 20, loss = 0.0053
Iteration 40, loss = 0.0051
Iteration 60, loss = 0.0080
Iteration 80, loss = 0.0068
--- Epoch 1084 / 1506 - 2578 epochs total
Iteration 0, loss = 0.0046
Iteration 20, loss = 0.0030
Iteration 40, loss = 0.0028
Iteration 60, loss = 0.0043
Iteration 80, loss = 0.0050
--- Epoch 1085 / 1506 - 2579 epochs total
Iteration 0, loss = 0.0021
Iteration 20, loss = 0.0024
Iteration 40, loss = 0.0033
Iteration 60, loss = 0.0043
Iteration 80, loss = 0.0034
--- Epoch 1086 / 1506 - 2580 epochs total
Iteration 0, loss = 0.0023
Iteration 20, loss = 0.0025
Iteration 40, loss = 0.0046
Iteration 60, loss = 0.0016
Iteration 80, loss = 0.0047
--- Epoch 1087 / 1506 - 2581 epochs total
Iteration 0, loss = 0.0030
Iteration 20, loss = 0.0072
Iteration 40, loss = 0.0042
Iteration 60, loss = 0.0112
Iteration 80, loss = 0.0058
--- Epoch 1088 / 1506 - 2582 epochs total
Iteration 0, loss = 0.0036
Iteration 20, loss = 0.0026
Iteration 40, loss = 0.0014
Iteration 60, loss = 0.0055
Iteration 80, loss = 0.0025
--- Epoch 1089 / 1506 - 2583 epochs total
Iteration 0, loss = 0.0061
Iteration 20, loss = 0.0043
Iteration 40, loss = 0.0059
Iteration 60, loss = 0.0060
Iteration 80, loss = 0.0034
--- Epoch 1090 / 1506 - 2584 epochs total
Iteration 0, loss = 0.0012
Iteration 20, loss = 0.0038
Iteration 40, loss = 0.0020
Iteration 60, loss = 0.0019
Iteration 80, loss = 0.0046
--- Epoch 1091 / 1506 - 2585 epochs total
Iteration 0, loss = 0.0037
Iteration 20, loss = 0.0019
Iteration 40, loss = 0.0122
Iteration 60, loss = 0.0033
Iteration 80, loss = 0.0033
--- Epoch 1092 / 1506 - 2586 epochs total
Iteration 0, loss = 0.0036
Iteration 20, loss = 0.0029
Iteration 40, loss = 0.0023
Iteration 60, loss = 0.0027
Iteration 80, loss = 0.0026
--- Epoch 1093 / 1506 - 2587 epochs total
Iteration 0, loss = 0.0039
Iteration 20, loss = 0.0038
Iteration 40, loss = 0.0029
Iteration 60, loss = 0.0053
Iteration 80, loss = 0.0038
--- Epoch 1094 / 1506 - 2588 epochs total
Iteration 0, loss = 0.0135
Iteration 20, loss = 0.0032
Iteration 40, loss = 0.0030
Iteration 60, loss = 0.0075
Iteration 80, loss = 0.0027
--- Epoch 1095 / 1506 - 2589 epochs total
Iteration 0, loss = 0.0016
Iteration 20, loss = 0.0017
Iteration 40, loss = 0.0020
Iteration 60, loss = 0.0050
Iteration 80, loss = 0.0027
--- Epoch 1096 / 1506 - 2590 epochs total
Iteration 0, loss = 0.0028
Iteration 20, loss = 0.0038
Iteration 40, loss = 0.0037
Iteration 60, loss = 0.0029
Iteration 80, loss = 0.0031
--- Epoch 1097 / 1506 - 2591 epochs total
Iteration 0, loss = 0.0020
Iteration 20, loss = 0.0041
Iteration 40, loss = 0.0037
Iteration 60, loss = 0.0038
Iteration 80, loss = 0.0034
--- Epoch 1098 / 1506 - 2592 epochs total
Iteration 0, loss = 0.0035
Iteration 20, loss = 0.0052
Iteration 40, loss = 0.0044
Iteration 60, loss = 0.0024
Iteration 80, loss = 0.0067
--- Epoch 1099 / 1506 - 2593 epochs total
Iteration 0, loss = 0.0025
Iteration 20, loss = 0.0026
Iteration 40, loss = 0.0051
Iteration 60, loss = 0.0024
Iteration 80, loss = 0.0025
--- Epoch 1100 / 1506 - 2594 epochs total
Iteration 0, loss = 0.0046
Iteration 20, loss = 0.0022
Iteration 40, loss = 0.0129
Iteration 60, loss = 0.0031
Iteration 80, loss = 0.0030
--- Epoch 1101 / 1506 - 2595 epochs total
Iteration 0, loss = 0.0254
Iteration 20, loss = 0.0084
Iteration 40, loss = 0.0018
Iteration 60, loss = 0.0031
Iteration 80, loss = 0.0033
--- Epoch 1102 / 1506 - 2596 epochs total
Iteration 0, loss = 0.0024
Iteration 20, loss = 0.0056
Iteration 40, loss = 0.0037
Iteration 60, loss = 0.0030
Iteration 80, loss = 0.0049
--- Epoch 1103 / 1506 - 2597 epochs total
Iteration 0, loss = 0.0121
Iteration 20, loss = 0.0046
Iteration 40, loss = 0.0041
Iteration 60, loss = 0.0041
Iteration 80, loss = 0.0028
--- Epoch 1104 / 1506 - 2598 epochs total
Iteration 0, loss = 0.0042
Iteration 20, loss = 0.0032
Iteration 40, loss = 0.0029
Iteration 60, loss = 0.0028
Iteration 80, loss = 0.0051
--- Epoch 1105 / 1506 - 2599 epochs total
Iteration 0, loss = 0.0045
Iteration 20, loss = 0.0106
Iteration 40, loss = 0.0054
Iteration 60, loss = 0.0086
Iteration 80, loss = 0.0037
--- Epoch 1106 / 1506 - 2600 epochs total
Iteration 0, loss = 0.0040
Iteration 20, loss = 0.0029
Iteration 40, loss = 0.0026
Iteration 60, loss = 0.0061
Iteration 80, loss = 0.0043
--- Epoch 1107 / 1506 - 2601 epochs total
Iteration 0, loss = 0.0018
Iteration 20, loss = 0.0035
Iteration 40, loss = 0.0040
Iteration 60, loss = 0.0068
Iteration 80, loss = 0.0030
--- Epoch 1108 / 1506 - 2602 epochs total
Iteration 0, loss = 0.0053
Iteration 20, loss = 0.0056
Iteration 40, loss = 0.0060
Iteration 60, loss = 0.0023
Iteration 80, loss = 0.0049
--- Epoch 1109 / 1506 - 2603 epochs total
Iteration 0, loss = 0.0026
Iteration 20, loss = 0.0060
Iteration 40, loss = 0.0024
Iteration 60, loss = 0.0107
Iteration 80, loss = 0.0025
--- Epoch 1110 / 1506 - 2604 epochs total
Iteration 0, loss = 0.0024
Iteration 20, loss = 0.0049
Iteration 40, loss = 0.0018
Iteration 60, loss = 0.0044
Iteration 80, loss = 0.0079
--- Epoch 1111 / 1506 - 2605 epochs total
Iteration 0, loss = 0.0048
Iteration 20, loss = 0.0036
Iteration 40, loss = 0.0063
Iteration 60, loss = 0.0023
Iteration 80, loss = 0.0031
--- Epoch 1112 / 1506 - 2606 epochs total
Iteration 0, loss = 0.0023
Iteration 20, loss = 0.0030
Iteration 40, loss = 0.0055
Iteration 60, loss = 0.0033
Iteration 80, loss = 0.0047
--- Epoch 1113 / 1506 - 2607 epochs total
Iteration 0, loss = 0.0084
Iteration 20, loss = 0.0018
Iteration 40, loss = 0.0031
Iteration 60, loss = 0.0025
Iteration 80, loss = 0.0024
--- Epoch 1114 / 1506 - 2608 epochs total
Iteration 0, loss = 0.0053
Iteration 20, loss = 0.0027
Iteration 40, loss = 0.0022
Iteration 60, loss = 0.0019
Iteration 80, loss = 0.0057
--- Epoch 1115 / 1506 - 2609 epochs total
Iteration 0, loss = 0.0091
Iteration 20, loss = 0.0047
Iteration 40, loss = 0.0025
Iteration 60, loss = 0.0036
Iteration 80, loss = 0.0088
--- Epoch 1116 / 1506 - 2610 epochs total
Iteration 0, loss = 0.0020
Iteration 20, loss = 0.0036
Iteration 40, loss = 0.0027
Iteration 60, loss = 0.0023
Iteration 80, loss = 0.0027
--- Epoch 1117 / 1506 - 2611 epochs total
Iteration 0, loss = 0.0045
Iteration 20, loss = 0.0024
Iteration 40, loss = 0.0043
Iteration 60, loss = 0.0073
Iteration 80, loss = 0.0054
--- Epoch 1118 / 1506 - 2612 epochs total
Iteration 0, loss = 0.0015
Iteration 20, loss = 0.0026
Iteration 40, loss = 0.0035
Iteration 60, loss = 0.0079
Iteration 80, loss = 0.0024
--- Epoch 1119 / 1506 - 2613 epochs total
Iteration 0, loss = 0.0040
Iteration 20, loss = 0.0029
Iteration 40, loss = 0.0127
Iteration 60, loss = 0.0023
Iteration 80, loss = 0.0029
--- Epoch 1120 / 1506 - 2614 epochs total
Iteration 0, loss = 0.0029
Iteration 20, loss = 0.0017
Iteration 40, loss = 0.0036
Iteration 60, loss = 0.0030
Iteration 80, loss = 0.0020
--- Epoch 1121 / 1506 - 2615 epochs total
Iteration 0, loss = 0.0032
Iteration 20, loss = 0.0043
Iteration 40, loss = 0.0045
Iteration 60, loss = 0.0037
Iteration 80, loss = 0.0067
--- Epoch 1122 / 1506 - 2616 epochs total
Iteration 0, loss = 0.0062
Iteration 20, loss = 0.0077
Iteration 40, loss = 0.0073
Iteration 60, loss = 0.0017
Iteration 80, loss = 0.0057
--- Epoch 1123 / 1506 - 2617 epochs total
Iteration 0, loss = 0.0046
Iteration 20, loss = 0.0042
Iteration 40, loss = 0.0036
Iteration 60, loss = 0.0035
Iteration 80, loss = 0.0025
--- Epoch 1124 / 1506 - 2618 epochs total
Iteration 0, loss = 0.0036
Iteration 20, loss = 0.0050
Iteration 40, loss = 0.0032
Iteration 60, loss = 0.0037
Iteration 80, loss = 0.0019
--- Epoch 1125 / 1506 - 2619 epochs total
Iteration 0, loss = 0.0036
Iteration 20, loss = 0.0044
Iteration 40, loss = 0.0088
Iteration 60, loss = 0.0032
Iteration 80, loss = 0.0253
--- Epoch 1126 / 1506 - 2620 epochs total
Iteration 0, loss = 0.0028
Iteration 20, loss = 0.0054
Iteration 40, loss = 0.0013
Iteration 60, loss = 0.0109
Iteration 80, loss = 0.0077
--- Epoch 1127 / 1506 - 2621 epochs total
Iteration 0, loss = 0.0034
Iteration 20, loss = 0.0055
Iteration 40, loss = 0.0034
Iteration 60, loss = 0.0017
Iteration 80, loss = 0.0046
--- Epoch 1128 / 1506 - 2622 epochs total
Iteration 0, loss = 0.0055
Iteration 20, loss = 0.0040
Iteration 40, loss = 0.0044
Iteration 60, loss = 0.0024
Iteration 80, loss = 0.0028
--- Epoch 1129 / 1506 - 2623 epochs total
Iteration 0, loss = 0.0022
Iteration 20, loss = 0.0051
Iteration 40, loss = 0.0020
Iteration 60, loss = 0.0028
Iteration 80, loss = 0.0022
--- Epoch 1130 / 1506 - 2624 epochs total
Iteration 0, loss = 0.0057
Iteration 20, loss = 0.0044
Iteration 40, loss = 0.0017
Iteration 60, loss = 0.0047
Iteration 80, loss = 0.0029
--- Epoch 1131 / 1506 - 2625 epochs total
Iteration 0, loss = 0.0045
Iteration 20, loss = 0.0027
Iteration 40, loss = 0.0022
Iteration 60, loss = 0.0030
Iteration 80, loss = 0.0114
--- Epoch 1132 / 1506 - 2626 epochs total
Iteration 0, loss = 0.0033
Iteration 20, loss = 0.0028
Iteration 40, loss = 0.0070
Iteration 60, loss = 0.0061
Iteration 80, loss = 0.0016
--- Epoch 1133 / 1506 - 2627 epochs total
Iteration 0, loss = 0.0060
Iteration 20, loss = 0.0039
Iteration 40, loss = 0.0090
Iteration 60, loss = 0.0019
Iteration 80, loss = 0.0024
--- Epoch 1134 / 1506 - 2628 epochs total
Iteration 0, loss = 0.0026
Iteration 20, loss = 0.0024
Iteration 40, loss = 0.0012
Iteration 60, loss = 0.0080
Iteration 80, loss = 0.0089
--- Epoch 1135 / 1506 - 2629 epochs total
Iteration 0, loss = 0.0031
Iteration 20, loss = 0.0028
Iteration 40, loss = 0.0041
Iteration 60, loss = 0.0021
Iteration 80, loss = 0.0065
--- Epoch 1136 / 1506 - 2630 epochs total
Iteration 0, loss = 0.0037
Iteration 20, loss = 0.0030
Iteration 40, loss = 0.0024
Iteration 60, loss = 0.0023
Iteration 80, loss = 0.0037
--- Epoch 1137 / 1506 - 2631 epochs total
Iteration 0, loss = 0.0039
Iteration 20, loss = 0.0124
Iteration 40, loss = 0.0027
Iteration 60, loss = 0.0048
Iteration 80, loss = 0.0033
--- Epoch 1138 / 1506 - 2632 epochs total
Iteration 0, loss = 0.0067
Iteration 20, loss = 0.0056
Iteration 40, loss = 0.0066
Iteration 60, loss = 0.0053
Iteration 80, loss = 0.0019
--- Epoch 1139 / 1506 - 2633 epochs total
Iteration 0, loss = 0.0043
Iteration 20, loss = 0.0044
Iteration 40, loss = 0.0021
Iteration 60, loss = 0.0024
Iteration 80, loss = 0.0018
--- Epoch 1140 / 1506 - 2634 epochs total
Iteration 0, loss = 0.0036
Iteration 20, loss = 0.0029
Iteration 40, loss = 0.0050
Iteration 60, loss = 0.0031
Iteration 80, loss = 0.0035
--- Epoch 1141 / 1506 - 2635 epochs total
Iteration 0, loss = 0.0033
Iteration 20, loss = 0.0040
Iteration 40, loss = 0.0025
Iteration 60, loss = 0.0058
Iteration 80, loss = 0.0037
--- Epoch 1142 / 1506 - 2636 epochs total
Iteration 0, loss = 0.0028
Iteration 20, loss = 0.0026
Iteration 40, loss = 0.0090
Iteration 60, loss = 0.0066
Iteration 80, loss = 0.0023
--- Epoch 1143 / 1506 - 2637 epochs total
Iteration 0, loss = 0.0056
Iteration 20, loss = 0.0031
Iteration 40, loss = 0.0036
Iteration 60, loss = 0.0059
Iteration 80, loss = 0.0065
--- Epoch 1144 / 1506 - 2638 epochs total
Iteration 0, loss = 0.0044
Iteration 20, loss = 0.0045
Iteration 40, loss = 0.0029
Iteration 60, loss = 0.0039
Iteration 80, loss = 0.0039
--- Epoch 1145 / 1506 - 2639 epochs total
Iteration 0, loss = 0.0036
Iteration 20, loss = 0.0024
Iteration 40, loss = 0.0054
Iteration 60, loss = 0.0046
Iteration 80, loss = 0.0023
--- Epoch 1146 / 1506 - 2640 epochs total
Iteration 0, loss = 0.0021
Iteration 20, loss = 0.0036
Iteration 40, loss = 0.0048
Iteration 60, loss = 0.0020
Iteration 80, loss = 0.0075
--- Epoch 1147 / 1506 - 2641 epochs total
Iteration 0, loss = 0.0027
Iteration 20, loss = 0.0025
Iteration 40, loss = 0.0033
Iteration 60, loss = 0.0045
Iteration 80, loss = 0.0070
--- Epoch 1148 / 1506 - 2642 epochs total
Iteration 0, loss = 0.0106
Iteration 20, loss = 0.0081
Iteration 40, loss = 0.0028
Iteration 60, loss = 0.0038
Iteration 80, loss = 0.0031
--- Epoch 1149 / 1506 - 2643 epochs total
Iteration 0, loss = 0.0036
Iteration 20, loss = 0.0047
Iteration 40, loss = 0.0044
Iteration 60, loss = 0.0021
Iteration 80, loss = 0.0046
--- Epoch 1150 / 1506 - 2644 epochs total
Iteration 0, loss = 0.0035
Iteration 20, loss = 0.0034
Iteration 40, loss = 0.0099
Iteration 60, loss = 0.0030
Iteration 80, loss = 0.0054
--- Epoch 1151 / 1506 - 2645 epochs total
Iteration 0, loss = 0.0176
Iteration 20, loss = 0.0022
Iteration 40, loss = 0.0059
Iteration 60, loss = 0.0040
Iteration 80, loss = 0.0030
--- Epoch 1152 / 1506 - 2646 epochs total
Iteration 0, loss = 0.0024
Iteration 20, loss = 0.0023
Iteration 40, loss = 0.0029
Iteration 60, loss = 0.0036
Iteration 80, loss = 0.0083
--- Epoch 1153 / 1506 - 2647 epochs total
Iteration 0, loss = 0.0023
Iteration 20, loss = 0.0045
Iteration 40, loss = 0.0099
Iteration 60, loss = 0.0044
Iteration 80, loss = 0.0054
--- Epoch 1154 / 1506 - 2648 epochs total
Iteration 0, loss = 0.0042
Iteration 20, loss = 0.0016
Iteration 40, loss = 0.0043
Iteration 60, loss = 0.0046
Iteration 80, loss = 0.0039
--- Epoch 1155 / 1506 - 2649 epochs total
Iteration 0, loss = 0.0114
Iteration 20, loss = 0.0031
Iteration 40, loss = 0.0025
Iteration 60, loss = 0.0036
Iteration 80, loss = 0.0040
--- Epoch 1156 / 1506 - 2650 epochs total
Iteration 0, loss = 0.0052
Iteration 20, loss = 0.0029
Iteration 40, loss = 0.0035
Iteration 60, loss = 0.0043
Iteration 80, loss = 0.0038
--- Epoch 1157 / 1506 - 2651 epochs total
Iteration 0, loss = 0.0029
Iteration 20, loss = 0.0043
Iteration 40, loss = 0.0016
Iteration 60, loss = 0.0042
Iteration 80, loss = 0.0084
--- Epoch 1158 / 1506 - 2652 epochs total
Iteration 0, loss = 0.0043
Iteration 20, loss = 0.0016
Iteration 40, loss = 0.0055
Iteration 60, loss = 0.0041
Iteration 80, loss = 0.0024
--- Epoch 1159 / 1506 - 2653 epochs total
Iteration 0, loss = 0.0035
Iteration 20, loss = 0.0038
Iteration 40, loss = 0.0098
Iteration 60, loss = 0.0027
Iteration 80, loss = 0.0042
--- Epoch 1160 / 1506 - 2654 epochs total
Iteration 0, loss = 0.0026
Iteration 20, loss = 0.0018
Iteration 40, loss = 0.0011
Iteration 60, loss = 0.0098
Iteration 80, loss = 0.0027
--- Epoch 1161 / 1506 - 2655 epochs total
Iteration 0, loss = 0.0025
Iteration 20, loss = 0.0040
Iteration 40, loss = 0.0028
Iteration 60, loss = 0.0066
Iteration 80, loss = 0.0030
--- Epoch 1162 / 1506 - 2656 epochs total
Iteration 0, loss = 0.0032
Iteration 20, loss = 0.0056
Iteration 40, loss = 0.0033
Iteration 60, loss = 0.0053
Iteration 80, loss = 0.0060
--- Epoch 1163 / 1506 - 2657 epochs total
Iteration 0, loss = 0.0112
Iteration 20, loss = 0.0031
Iteration 40, loss = 0.0022
Iteration 60, loss = 0.0040
Iteration 80, loss = 0.0053
--- Epoch 1164 / 1506 - 2658 epochs total
Iteration 0, loss = 0.0081
Iteration 20, loss = 0.0287
Iteration 40, loss = 0.0018
Iteration 60, loss = 0.0028
Iteration 80, loss = 0.0042
--- Epoch 1165 / 1506 - 2659 epochs total
Iteration 0, loss = 0.0043
Iteration 20, loss = 0.0044
Iteration 40, loss = 0.0055
Iteration 60, loss = 0.0046
Iteration 80, loss = 0.0024
--- Epoch 1166 / 1506 - 2660 epochs total
Iteration 0, loss = 0.0057
Iteration 20, loss = 0.0032
Iteration 40, loss = 0.0044
Iteration 60, loss = 0.0051
Iteration 80, loss = 0.0022
--- Epoch 1167 / 1506 - 2661 epochs total
Iteration 0, loss = 0.0048
Iteration 20, loss = 0.0018
Iteration 40, loss = 0.0032
Iteration 60, loss = 0.0057
Iteration 80, loss = 0.0024
--- Epoch 1168 / 1506 - 2662 epochs total
Iteration 0, loss = 0.0085
Iteration 20, loss = 0.0032
Iteration 40, loss = 0.0023
Iteration 60, loss = 0.0029
Iteration 80, loss = 0.0044
--- Epoch 1169 / 1506 - 2663 epochs total
Iteration 0, loss = 0.0039
Iteration 20, loss = 0.0068
Iteration 40, loss = 0.0044
Iteration 60, loss = 0.0076
Iteration 80, loss = 0.0029
--- Epoch 1170 / 1506 - 2664 epochs total
Iteration 0, loss = 0.0058
Iteration 20, loss = 0.0030
Iteration 40, loss = 0.0052
Iteration 60, loss = 0.0210
Iteration 80, loss = 0.0054
--- Epoch 1171 / 1506 - 2665 epochs total
Iteration 0, loss = 0.0048
Iteration 20, loss = 0.0059
Iteration 40, loss = 0.0018
Iteration 60, loss = 0.0039
Iteration 80, loss = 0.0027
--- Epoch 1172 / 1506 - 2666 epochs total
Iteration 0, loss = 0.0068
Iteration 20, loss = 0.0025
Iteration 40, loss = 0.0039
Iteration 60, loss = 0.0031
Iteration 80, loss = 0.0032
--- Epoch 1173 / 1506 - 2667 epochs total
Iteration 0, loss = 0.0040
Iteration 20, loss = 0.0032
Iteration 40, loss = 0.0047
Iteration 60, loss = 0.0039
Iteration 80, loss = 0.0055
--- Epoch 1174 / 1506 - 2668 epochs total
Iteration 0, loss = 0.0035
Iteration 20, loss = 0.0081
Iteration 40, loss = 0.0029
Iteration 60, loss = 0.0019
Iteration 80, loss = 0.0049
--- Epoch 1175 / 1506 - 2669 epochs total
Iteration 0, loss = 0.0038
Iteration 20, loss = 0.0031
Iteration 40, loss = 0.0021
Iteration 60, loss = 0.0035
Iteration 80, loss = 0.0042
--- Epoch 1176 / 1506 - 2670 epochs total
Iteration 0, loss = 0.0018
Iteration 20, loss = 0.0024
Iteration 40, loss = 0.0030
Iteration 60, loss = 0.0055
Iteration 80, loss = 0.0066
--- Epoch 1177 / 1506 - 2671 epochs total
Iteration 0, loss = 0.0038
Iteration 20, loss = 0.0024
Iteration 40, loss = 0.0027
Iteration 60, loss = 0.0035
Iteration 80, loss = 0.0050
--- Epoch 1178 / 1506 - 2672 epochs total
Iteration 0, loss = 0.0017
Iteration 20, loss = 0.0036
Iteration 40, loss = 0.0125
Iteration 60, loss = 0.0024
Iteration 80, loss = 0.0033
--- Epoch 1179 / 1506 - 2673 epochs total
Iteration 0, loss = 0.0037
Iteration 20, loss = 0.0070
Iteration 40, loss = 0.0039
Iteration 60, loss = 0.0044
Iteration 80, loss = 0.0061
--- Epoch 1180 / 1506 - 2674 epochs total
Iteration 0, loss = 0.0035
Iteration 20, loss = 0.0085
Iteration 40, loss = 0.0024
Iteration 60, loss = 0.0067
Iteration 80, loss = 0.0052
--- Epoch 1181 / 1506 - 2675 epochs total
Iteration 0, loss = 0.0040
Iteration 20, loss = 0.0192
Iteration 40, loss = 0.0031
Iteration 60, loss = 0.0039
Iteration 80, loss = 0.0023
--- Epoch 1182 / 1506 - 2676 epochs total
Iteration 0, loss = 0.0033
Iteration 20, loss = 0.0104
Iteration 40, loss = 0.0046
Iteration 60, loss = 0.0048
Iteration 80, loss = 0.0035
--- Epoch 1183 / 1506 - 2677 epochs total
Iteration 0, loss = 0.0031
Iteration 20, loss = 0.0032
Iteration 40, loss = 0.0052
Iteration 60, loss = 0.0024
Iteration 80, loss = 0.0045
--- Epoch 1184 / 1506 - 2678 epochs total
Iteration 0, loss = 0.0014
Iteration 20, loss = 0.0030
Iteration 40, loss = 0.0027
Iteration 60, loss = 0.0025
Iteration 80, loss = 0.0079
--- Epoch 1185 / 1506 - 2679 epochs total
Iteration 0, loss = 0.0026
Iteration 20, loss = 0.0059
Iteration 40, loss = 0.0056
Iteration 60, loss = 0.0070
Iteration 80, loss = 0.0050
--- Epoch 1186 / 1506 - 2680 epochs total
Iteration 0, loss = 0.0034
Iteration 20, loss = 0.0027
Iteration 40, loss = 0.0037
Iteration 60, loss = 0.0027
Iteration 80, loss = 0.0026
--- Epoch 1187 / 1506 - 2681 epochs total
Iteration 0, loss = 0.0040
Iteration 20, loss = 0.0119
Iteration 40, loss = 0.0038
Iteration 60, loss = 0.0117
Iteration 80, loss = 0.0026
--- Epoch 1188 / 1506 - 2682 epochs total
Iteration 0, loss = 0.0016
Iteration 20, loss = 0.0029
Iteration 40, loss = 0.0087
Iteration 60, loss = 0.0082
Iteration 80, loss = 0.0024
--- Epoch 1189 / 1506 - 2683 epochs total
Iteration 0, loss = 0.0028
Iteration 20, loss = 0.0046
Iteration 40, loss = 0.0035
Iteration 60, loss = 0.0049
Iteration 80, loss = 0.0032
--- Epoch 1190 / 1506 - 2684 epochs total
Iteration 0, loss = 0.0045
Iteration 20, loss = 0.0126
Iteration 40, loss = 0.0051
Iteration 60, loss = 0.0027
Iteration 80, loss = 0.0077
--- Epoch 1191 / 1506 - 2685 epochs total
Iteration 0, loss = 0.0029
Iteration 20, loss = 0.0016
Iteration 40, loss = 0.0091
Iteration 60, loss = 0.0033
Iteration 80, loss = 0.0049
--- Epoch 1192 / 1506 - 2686 epochs total
Iteration 0, loss = 0.0020
Iteration 20, loss = 0.0033
Iteration 40, loss = 0.0031
Iteration 60, loss = 0.0047
Iteration 80, loss = 0.0016
--- Epoch 1193 / 1506 - 2687 epochs total
Iteration 0, loss = 0.0032
Iteration 20, loss = 0.0028
Iteration 40, loss = 0.0040
Iteration 60, loss = 0.0051
Iteration 80, loss = 0.0029
--- Epoch 1194 / 1506 - 2688 epochs total
Iteration 0, loss = 0.0017
Iteration 20, loss = 0.0033
Iteration 40, loss = 0.0027
Iteration 60, loss = 0.0054
Iteration 80, loss = 0.0041
--- Epoch 1195 / 1506 - 2689 epochs total
Iteration 0, loss = 0.0035
Iteration 20, loss = 0.0041
Iteration 40, loss = 0.0021
Iteration 60, loss = 0.0060
Iteration 80, loss = 0.0029
--- Epoch 1196 / 1506 - 2690 epochs total
Iteration 0, loss = 0.0044
Iteration 20, loss = 0.0032
Iteration 40, loss = 0.0014
Iteration 60, loss = 0.0075
Iteration 80, loss = 0.0043
--- Epoch 1197 / 1506 - 2691 epochs total
Iteration 0, loss = 0.0029
Iteration 20, loss = 0.0063
Iteration 40, loss = 0.0035
Iteration 60, loss = 0.0041
Iteration 80, loss = 0.0054
--- Epoch 1198 / 1506 - 2692 epochs total
Iteration 0, loss = 0.0096
Iteration 20, loss = 0.0068
Iteration 40, loss = 0.0027
Iteration 60, loss = 0.0088
Iteration 80, loss = 0.0069
--- Epoch 1199 / 1506 - 2693 epochs total
Iteration 0, loss = 0.0028
Iteration 20, loss = 0.0043
Iteration 40, loss = 0.0074
Iteration 60, loss = 0.0046
Iteration 80, loss = 0.0035
--- Epoch 1200 / 1506 - 2694 epochs total
Iteration 0, loss = 0.0109
Iteration 20, loss = 0.0043
Iteration 40, loss = 0.0043
Iteration 60, loss = 0.0032
Iteration 80, loss = 0.0140
--- Epoch 1201 / 1506 - 2695 epochs total
Iteration 0, loss = 0.0051
Iteration 20, loss = 0.0057
Iteration 40, loss = 0.0044
Iteration 60, loss = 0.0024
Iteration 80, loss = 0.0036
--- Epoch 1202 / 1506 - 2696 epochs total
Iteration 0, loss = 0.0512
Iteration 20, loss = 0.0061
Iteration 40, loss = 0.0038
Iteration 60, loss = 0.0055
Iteration 80, loss = 0.0091
--- Epoch 1203 / 1506 - 2697 epochs total
Iteration 0, loss = 0.0028
Iteration 20, loss = 0.0127
Iteration 40, loss = 0.0025
Iteration 60, loss = 0.0046
Iteration 80, loss = 0.0029
--- Epoch 1204 / 1506 - 2698 epochs total
Iteration 0, loss = 0.0037
Iteration 20, loss = 0.0020
Iteration 40, loss = 0.0076
Iteration 60, loss = 0.0023
Iteration 80, loss = 0.0045
--- Epoch 1205 / 1506 - 2699 epochs total
Iteration 0, loss = 0.0039
Iteration 20, loss = 0.0031
Iteration 40, loss = 0.0031
Iteration 60, loss = 0.0056
Iteration 80, loss = 0.0031
--- Epoch 1206 / 1506 - 2700 epochs total
Iteration 0, loss = 0.0143
Iteration 20, loss = 0.0020
Iteration 40, loss = 0.0041
Iteration 60, loss = 0.0027
Iteration 80, loss = 0.0059
--- Epoch 1207 / 1506 - 2701 epochs total
Iteration 0, loss = 0.0024
Iteration 20, loss = 0.0036
Iteration 40, loss = 0.0534
Iteration 60, loss = 0.0040
Iteration 80, loss = 0.0028
--- Epoch 1208 / 1506 - 2702 epochs total
Iteration 0, loss = 0.0041
Iteration 20, loss = 0.0021
Iteration 40, loss = 0.0027
Iteration 60, loss = 0.0041
Iteration 80, loss = 0.0029
--- Epoch 1209 / 1506 - 2703 epochs total
Iteration 0, loss = 0.0076
Iteration 20, loss = 0.0043
Iteration 40, loss = 0.0020
Iteration 60, loss = 0.0041
Iteration 80, loss = 0.0042
--- Epoch 1210 / 1506 - 2704 epochs total
Iteration 0, loss = 0.0060
Iteration 20, loss = 0.0043
Iteration 40, loss = 0.0416
Iteration 60, loss = 0.0043
Iteration 80, loss = 0.0026
--- Epoch 1211 / 1506 - 2705 epochs total
Iteration 0, loss = 0.0059
Iteration 20, loss = 0.0083
Iteration 40, loss = 0.0026
Iteration 60, loss = 0.0053
Iteration 80, loss = 0.0025
--- Epoch 1212 / 1506 - 2706 epochs total
Iteration 0, loss = 0.0034
Iteration 20, loss = 0.0091
Iteration 40, loss = 0.0056
Iteration 60, loss = 0.0050
Iteration 80, loss = 0.0045
--- Epoch 1213 / 1506 - 2707 epochs total
Iteration 0, loss = 0.0036
Iteration 20, loss = 0.0037
Iteration 40, loss = 0.0030
Iteration 60, loss = 0.0057
Iteration 80, loss = 0.0056
--- Epoch 1214 / 1506 - 2708 epochs total
Iteration 0, loss = 0.0028
Iteration 20, loss = 0.0085
Iteration 40, loss = 0.0061
Iteration 60, loss = 0.0040
Iteration 80, loss = 0.0035
--- Epoch 1215 / 1506 - 2709 epochs total
Iteration 0, loss = 0.0040
Iteration 20, loss = 0.0025
Iteration 40, loss = 0.0018
Iteration 60, loss = 0.0068
Iteration 80, loss = 0.0022
--- Epoch 1216 / 1506 - 2710 epochs total
Iteration 0, loss = 0.0027
Iteration 20, loss = 0.0044
Iteration 40, loss = 0.0032
Iteration 60, loss = 0.0032
Iteration 80, loss = 0.0059
--- Epoch 1217 / 1506 - 2711 epochs total
Iteration 0, loss = 0.0029
Iteration 20, loss = 0.0032
Iteration 40, loss = 0.0044
Iteration 60, loss = 0.0024
Iteration 80, loss = 0.0022
--- Epoch 1218 / 1506 - 2712 epochs total
Iteration 0, loss = 0.0023
Iteration 20, loss = 0.0028
Iteration 40, loss = 0.0047
Iteration 60, loss = 0.0079
Iteration 80, loss = 0.0024
--- Epoch 1219 / 1506 - 2713 epochs total
Iteration 0, loss = 0.0026
Iteration 20, loss = 0.0040
Iteration 40, loss = 0.0028
Iteration 60, loss = 0.0287
Iteration 80, loss = 0.0038
--- Epoch 1220 / 1506 - 2714 epochs total
Iteration 0, loss = 0.0021
Iteration 20, loss = 0.0032
Iteration 40, loss = 0.0028
Iteration 60, loss = 0.0038
Iteration 80, loss = 0.0041
--- Epoch 1221 / 1506 - 2715 epochs total
Iteration 0, loss = 0.0052
Iteration 20, loss = 0.0013
Iteration 40, loss = 0.0042
Iteration 60, loss = 0.0035
Iteration 80, loss = 0.0040
--- Epoch 1222 / 1506 - 2716 epochs total
Iteration 0, loss = 0.0029
Iteration 20, loss = 0.0029
Iteration 40, loss = 0.0047
Iteration 60, loss = 0.0033
Iteration 80, loss = 0.0034
--- Epoch 1223 / 1506 - 2717 epochs total
Iteration 0, loss = 0.0086
Iteration 20, loss = 0.0034
Iteration 40, loss = 0.0058
Iteration 60, loss = 0.0035
Iteration 80, loss = 0.0053
--- Epoch 1224 / 1506 - 2718 epochs total
Iteration 0, loss = 0.0048
Iteration 20, loss = 0.0022
Iteration 40, loss = 0.0041
Iteration 60, loss = 0.0047
Iteration 80, loss = 0.0041
--- Epoch 1225 / 1506 - 2719 epochs total
Iteration 0, loss = 0.0055
Iteration 20, loss = 0.0043
Iteration 40, loss = 0.0098
Iteration 60, loss = 0.0046
Iteration 80, loss = 0.0040
--- Epoch 1226 / 1506 - 2720 epochs total
Iteration 0, loss = 0.0113
Iteration 20, loss = 0.0049
Iteration 40, loss = 0.0025
Iteration 60, loss = 0.0073
Iteration 80, loss = 0.0050
--- Epoch 1227 / 1506 - 2721 epochs total
Iteration 0, loss = 0.0039
Iteration 20, loss = 0.0027
Iteration 40, loss = 0.0031
Iteration 60, loss = 0.0058
Iteration 80, loss = 0.0067
--- Epoch 1228 / 1506 - 2722 epochs total
Iteration 0, loss = 0.0039
Iteration 20, loss = 0.0034
Iteration 40, loss = 0.0061
Iteration 60, loss = 0.0038
Iteration 80, loss = 0.0043
--- Epoch 1229 / 1506 - 2723 epochs total
Iteration 0, loss = 0.0066
Iteration 20, loss = 0.0054
Iteration 40, loss = 0.0021
Iteration 60, loss = 0.0021
Iteration 80, loss = 0.0029
--- Epoch 1230 / 1506 - 2724 epochs total
Iteration 0, loss = 0.0057
Iteration 20, loss = 0.0061
Iteration 40, loss = 0.0033
Iteration 60, loss = 0.0029
Iteration 80, loss = 0.0038
--- Epoch 1231 / 1506 - 2725 epochs total
Iteration 0, loss = 0.0023
Iteration 20, loss = 0.0026
Iteration 40, loss = 0.0035
Iteration 60, loss = 0.0020
Iteration 80, loss = 0.0059
--- Epoch 1232 / 1506 - 2726 epochs total
Iteration 0, loss = 0.0018
Iteration 20, loss = 0.0093
Iteration 40, loss = 0.0107
Iteration 60, loss = 0.0067
Iteration 80, loss = 0.0021
--- Epoch 1233 / 1506 - 2727 epochs total
Iteration 0, loss = 0.0013
Iteration 20, loss = 0.0018
Iteration 40, loss = 0.0025
Iteration 60, loss = 0.0091
Iteration 80, loss = 0.0059
--- Epoch 1234 / 1506 - 2728 epochs total
Iteration 0, loss = 0.0019
Iteration 20, loss = 0.0018
Iteration 40, loss = 0.0024
Iteration 60, loss = 0.0040
Iteration 80, loss = 0.0080
--- Epoch 1235 / 1506 - 2729 epochs total
Iteration 0, loss = 0.0031
Iteration 20, loss = 0.0063
Iteration 40, loss = 0.0023
Iteration 60, loss = 0.0040
Iteration 80, loss = 0.0058
--- Epoch 1236 / 1506 - 2730 epochs total
Iteration 0, loss = 0.0026
Iteration 20, loss = 0.0032
Iteration 40, loss = 0.0041
Iteration 60, loss = 0.0047
Iteration 80, loss = 0.0042
--- Epoch 1237 / 1506 - 2731 epochs total
Iteration 0, loss = 0.0056
Iteration 20, loss = 0.0020
Iteration 40, loss = 0.0037
Iteration 60, loss = 0.0101
Iteration 80, loss = 0.0080
--- Epoch 1238 / 1506 - 2732 epochs total
Iteration 0, loss = 0.0061
Iteration 20, loss = 0.0410
Iteration 40, loss = 0.0230
Iteration 60, loss = 0.0041
Iteration 80, loss = 0.0015
--- Epoch 1239 / 1506 - 2733 epochs total
Iteration 0, loss = 0.0068
Iteration 20, loss = 0.0130
Iteration 40, loss = 0.0021
Iteration 60, loss = 0.0040
Iteration 80, loss = 0.0070
--- Epoch 1240 / 1506 - 2734 epochs total
Iteration 0, loss = 0.0022
Iteration 20, loss = 0.0032
Iteration 40, loss = 0.0045
Iteration 60, loss = 0.0023
Iteration 80, loss = 0.0039
--- Epoch 1241 / 1506 - 2735 epochs total
Iteration 0, loss = 0.0067
Iteration 20, loss = 0.0095
Iteration 40, loss = 0.0024
Iteration 60, loss = 0.0020
Iteration 80, loss = 0.0038
--- Epoch 1242 / 1506 - 2736 epochs total
Iteration 0, loss = 0.0025
Iteration 20, loss = 0.0046
Iteration 40, loss = 0.0100
Iteration 60, loss = 0.0122
Iteration 80, loss = 0.0029
--- Epoch 1243 / 1506 - 2737 epochs total
Iteration 0, loss = 0.0033
Iteration 20, loss = 0.0019
Iteration 40, loss = 0.0033
Iteration 60, loss = 0.0028
Iteration 80, loss = 0.0070
--- Epoch 1244 / 1506 - 2738 epochs total
Iteration 0, loss = 0.0109
Iteration 20, loss = 0.0037
Iteration 40, loss = 0.0104
Iteration 60, loss = 0.0058
Iteration 80, loss = 0.0050
--- Epoch 1245 / 1506 - 2739 epochs total
Iteration 0, loss = 0.0040
Iteration 20, loss = 0.0042
Iteration 40, loss = 0.0087
Iteration 60, loss = 0.0043
Iteration 80, loss = 0.0063
--- Epoch 1246 / 1506 - 2740 epochs total
Iteration 0, loss = 0.0061
Iteration 20, loss = 0.0027
Iteration 40, loss = 0.0047
Iteration 60, loss = 0.0035
Iteration 80, loss = 0.0040
--- Epoch 1247 / 1506 - 2741 epochs total
Iteration 0, loss = 0.0061
Iteration 20, loss = 0.0036
Iteration 40, loss = 0.0032
Iteration 60, loss = 0.0031
Iteration 80, loss = 0.0056
--- Epoch 1248 / 1506 - 2742 epochs total
Iteration 0, loss = 0.0040
Iteration 20, loss = 0.0055
Iteration 40, loss = 0.0015
Iteration 60, loss = 0.0034
Iteration 80, loss = 0.0056
--- Epoch 1249 / 1506 - 2743 epochs total
Iteration 0, loss = 0.0022
Iteration 20, loss = 0.0037
Iteration 40, loss = 0.0020
Iteration 60, loss = 0.0057
Iteration 80, loss = 0.0047
--- Epoch 1250 / 1506 - 2744 epochs total
Iteration 0, loss = 0.0032
Iteration 20, loss = 0.0060
Iteration 40, loss = 0.0047
Iteration 60, loss = 0.0039
Iteration 80, loss = 0.0035
--- Epoch 1251 / 1506 - 2745 epochs total
Iteration 0, loss = 0.0032
Iteration 20, loss = 0.0119
Iteration 40, loss = 0.0017
Iteration 60, loss = 0.0040
Iteration 80, loss = 0.0025
--- Epoch 1252 / 1506 - 2746 epochs total
Iteration 0, loss = 0.0037
Iteration 20, loss = 0.0039
Iteration 40, loss = 0.0020
Iteration 60, loss = 0.0021
Iteration 80, loss = 0.0067
--- Epoch 1253 / 1506 - 2747 epochs total
Iteration 0, loss = 0.0038
Iteration 20, loss = 0.0016
Iteration 40, loss = 0.0067
Iteration 60, loss = 0.0020
Iteration 80, loss = 0.0035
--- Epoch 1254 / 1506 - 2748 epochs total
Iteration 0, loss = 0.0026
Iteration 20, loss = 0.0055
Iteration 40, loss = 0.0025
Iteration 60, loss = 0.0019
Iteration 80, loss = 0.0084
--- Epoch 1255 / 1506 - 2749 epochs total
Iteration 0, loss = 0.0023
Iteration 20, loss = 0.0028
Iteration 40, loss = 0.0045
Iteration 60, loss = 0.0023
Iteration 80, loss = 0.0073
--- Epoch 1256 / 1506 - 2750 epochs total
Iteration 0, loss = 0.0044
Iteration 20, loss = 0.0029
Iteration 40, loss = 0.0150
Iteration 60, loss = 0.0037
Iteration 80, loss = 0.0042
--- Epoch 1257 / 1506 - 2751 epochs total
Iteration 0, loss = 0.0041
Iteration 20, loss = 0.0063
Iteration 40, loss = 0.0037
Iteration 60, loss = 0.0048
Iteration 80, loss = 0.0020
--- Epoch 1258 / 1506 - 2752 epochs total
Iteration 0, loss = 0.0030
Iteration 20, loss = 0.0051
Iteration 40, loss = 0.0024
Iteration 60, loss = 0.0060
Iteration 80, loss = 0.0019
--- Epoch 1259 / 1506 - 2753 epochs total
Iteration 0, loss = 0.0024
Iteration 20, loss = 0.0032
Iteration 40, loss = 0.0028
Iteration 60, loss = 0.0064
Iteration 80, loss = 0.0069
--- Epoch 1260 / 1506 - 2754 epochs total
Iteration 0, loss = 0.0018
Iteration 20, loss = 0.0055
Iteration 40, loss = 0.0035
Iteration 60, loss = 0.0214
Iteration 80, loss = 0.0030
--- Epoch 1261 / 1506 - 2755 epochs total
Iteration 0, loss = 0.0035
Iteration 20, loss = 0.0028
Iteration 40, loss = 0.0024
Iteration 60, loss = 0.0054
Iteration 80, loss = 0.0129
--- Epoch 1262 / 1506 - 2756 epochs total
Iteration 0, loss = 0.0031
Iteration 20, loss = 0.0034
Iteration 40, loss = 0.0022
Iteration 60, loss = 0.0029
Iteration 80, loss = 0.0025
--- Epoch 1263 / 1506 - 2757 epochs total
Iteration 0, loss = 0.0065
Iteration 20, loss = 0.0025
Iteration 40, loss = 0.0023
Iteration 60, loss = 0.0039
Iteration 80, loss = 0.0051
--- Epoch 1264 / 1506 - 2758 epochs total
Iteration 0, loss = 0.0026
Iteration 20, loss = 0.0023
Iteration 40, loss = 0.0024
Iteration 60, loss = 0.0046
Iteration 80, loss = 0.0036
--- Epoch 1265 / 1506 - 2759 epochs total
Iteration 0, loss = 0.0073
Iteration 20, loss = 0.0069
Iteration 40, loss = 0.0072
Iteration 60, loss = 0.0038
Iteration 80, loss = 0.0039
--- Epoch 1266 / 1506 - 2760 epochs total
Iteration 0, loss = 0.0066
Iteration 20, loss = 0.0091
Iteration 40, loss = 0.0046
Iteration 60, loss = 0.0061
Iteration 80, loss = 0.0119
--- Epoch 1267 / 1506 - 2761 epochs total
Iteration 0, loss = 0.0016
Iteration 20, loss = 0.0028
Iteration 40, loss = 0.0027
Iteration 60, loss = 0.0037
Iteration 80, loss = 0.0024
--- Epoch 1268 / 1506 - 2762 epochs total
Iteration 0, loss = 0.0026
Iteration 20, loss = 0.0031
Iteration 40, loss = 0.0028
Iteration 60, loss = 0.0046
Iteration 80, loss = 0.0041
--- Epoch 1269 / 1506 - 2763 epochs total
Iteration 0, loss = 0.0061
Iteration 20, loss = 0.0044
Iteration 40, loss = 0.0031
Iteration 60, loss = 0.0029
Iteration 80, loss = 0.0035
--- Epoch 1270 / 1506 - 2764 epochs total
Iteration 0, loss = 0.0052
Iteration 20, loss = 0.0092
Iteration 40, loss = 0.0057
Iteration 60, loss = 0.0044
Iteration 80, loss = 0.0054
--- Epoch 1271 / 1506 - 2765 epochs total
Iteration 0, loss = 0.0076
Iteration 20, loss = 0.0041
Iteration 40, loss = 0.0149
Iteration 60, loss = 0.0090
Iteration 80, loss = 0.0105
--- Epoch 1272 / 1506 - 2766 epochs total
Iteration 0, loss = 0.0055
Iteration 20, loss = 0.0033
Iteration 40, loss = 0.0032
Iteration 60, loss = 0.0030
Iteration 80, loss = 0.0022
--- Epoch 1273 / 1506 - 2767 epochs total
Iteration 0, loss = 0.0017
Iteration 20, loss = 0.0130
Iteration 40, loss = 0.0033
Iteration 60, loss = 0.0027
Iteration 80, loss = 0.0043
--- Epoch 1274 / 1506 - 2768 epochs total
Iteration 0, loss = 0.0033
Iteration 20, loss = 0.0718
Iteration 40, loss = 0.0033
Iteration 60, loss = 0.0067
Iteration 80, loss = 0.0026
--- Epoch 1275 / 1506 - 2769 epochs total
Iteration 0, loss = 0.0018
Iteration 20, loss = 0.0056
Iteration 40, loss = 0.0053
Iteration 60, loss = 0.0051
Iteration 80, loss = 0.0028
--- Epoch 1276 / 1506 - 2770 epochs total
Iteration 0, loss = 0.0022
Iteration 20, loss = 0.0122
Iteration 40, loss = 0.0022
Iteration 60, loss = 0.0033
Iteration 80, loss = 0.0035
--- Epoch 1277 / 1506 - 2771 epochs total
Iteration 0, loss = 0.0025
Iteration 20, loss = 0.0080
Iteration 40, loss = 0.0148
Iteration 60, loss = 0.0035
Iteration 80, loss = 0.0024
--- Epoch 1278 / 1506 - 2772 epochs total
Iteration 0, loss = 0.0071
Iteration 20, loss = 0.0037
Iteration 40, loss = 0.0034
Iteration 60, loss = 0.0084
Iteration 80, loss = 0.0058
--- Epoch 1279 / 1506 - 2773 epochs total
Iteration 0, loss = 0.0097
Iteration 20, loss = 0.0018
Iteration 40, loss = 0.0064
Iteration 60, loss = 0.0039
Iteration 80, loss = 0.0060
--- Epoch 1280 / 1506 - 2774 epochs total
Iteration 0, loss = 0.0034
Iteration 20, loss = 0.0057
Iteration 40, loss = 0.0028
Iteration 60, loss = 0.0028
Iteration 80, loss = 0.0111
--- Epoch 1281 / 1506 - 2775 epochs total
Iteration 0, loss = 0.0021
Iteration 20, loss = 0.0028
Iteration 40, loss = 0.0184
Iteration 60, loss = 0.0062
Iteration 80, loss = 0.0027
--- Epoch 1282 / 1506 - 2776 epochs total
Iteration 0, loss = 0.0013
Iteration 20, loss = 0.0088
Iteration 40, loss = 0.0093
Iteration 60, loss = 0.0028
Iteration 80, loss = 0.0021
--- Epoch 1283 / 1506 - 2777 epochs total
Iteration 0, loss = 0.0122
Iteration 20, loss = 0.0028
Iteration 40, loss = 0.0013
Iteration 60, loss = 0.0020
Iteration 80, loss = 0.0044
--- Epoch 1284 / 1506 - 2778 epochs total
Iteration 0, loss = 0.0032
Iteration 20, loss = 0.0014
Iteration 40, loss = 0.0043
Iteration 60, loss = 0.0057
Iteration 80, loss = 0.0039
--- Epoch 1285 / 1506 - 2779 epochs total
Iteration 0, loss = 0.0051
Iteration 20, loss = 0.0127
Iteration 40, loss = 0.0028
Iteration 60, loss = 0.0032
Iteration 80, loss = 0.0031
--- Epoch 1286 / 1506 - 2780 epochs total
Iteration 0, loss = 0.0041
Iteration 20, loss = 0.0041
Iteration 40, loss = 0.0057
Iteration 60, loss = 0.0045
Iteration 80, loss = 0.0057
--- Epoch 1287 / 1506 - 2781 epochs total
Iteration 0, loss = 0.0080
Iteration 20, loss = 0.0043
Iteration 40, loss = 0.0035
Iteration 60, loss = 0.0022
Iteration 80, loss = 0.0026
--- Epoch 1288 / 1506 - 2782 epochs total
Iteration 0, loss = 0.0022
Iteration 20, loss = 0.0077
Iteration 40, loss = 0.0039
Iteration 60, loss = 0.0073
Iteration 80, loss = 0.0035
--- Epoch 1289 / 1506 - 2783 epochs total
Iteration 0, loss = 0.0041
Iteration 20, loss = 0.0032
Iteration 40, loss = 0.0055
Iteration 60, loss = 0.0104
Iteration 80, loss = 0.0106
--- Epoch 1290 / 1506 - 2784 epochs total
Iteration 0, loss = 0.0027
Iteration 20, loss = 0.0052
Iteration 40, loss = 0.0017
Iteration 60, loss = 0.0026
Iteration 80, loss = 0.0061
--- Epoch 1291 / 1506 - 2785 epochs total
Iteration 0, loss = 0.0093
Iteration 20, loss = 0.0057
Iteration 40, loss = 0.0020
Iteration 60, loss = 0.0037
Iteration 80, loss = 0.0028
--- Epoch 1292 / 1506 - 2786 epochs total
Iteration 0, loss = 0.0074
Iteration 20, loss = 0.0088
Iteration 40, loss = 0.0025
Iteration 60, loss = 0.0049
Iteration 80, loss = 0.0028
--- Epoch 1293 / 1506 - 2787 epochs total
Iteration 0, loss = 0.0028
Iteration 20, loss = 0.0044
Iteration 40, loss = 0.0095
Iteration 60, loss = 0.0055
Iteration 80, loss = 0.0029
--- Epoch 1294 / 1506 - 2788 epochs total
Iteration 0, loss = 0.0030
Iteration 20, loss = 0.0035
Iteration 40, loss = 0.0055
Iteration 60, loss = 0.0023
Iteration 80, loss = 0.0033
--- Epoch 1295 / 1506 - 2789 epochs total
Iteration 0, loss = 0.0026
Iteration 20, loss = 0.0020
Iteration 40, loss = 0.0016
Iteration 60, loss = 0.0046
Iteration 80, loss = 0.0031
--- Epoch 1296 / 1506 - 2790 epochs total
Iteration 0, loss = 0.0027
Iteration 20, loss = 0.0037
Iteration 40, loss = 0.0029
Iteration 60, loss = 0.0029
Iteration 80, loss = 0.0087
--- Epoch 1297 / 1506 - 2791 epochs total
Iteration 0, loss = 0.0032
Iteration 20, loss = 0.0049
Iteration 40, loss = 0.0034
Iteration 60, loss = 0.0018
Iteration 80, loss = 0.0035
--- Epoch 1298 / 1506 - 2792 epochs total
Iteration 0, loss = 0.0029
Iteration 20, loss = 0.0041
Iteration 40, loss = 0.0021
Iteration 60, loss = 0.0040
Iteration 80, loss = 0.0019
--- Epoch 1299 / 1506 - 2793 epochs total
Iteration 0, loss = 0.0027
Iteration 20, loss = 0.0029
Iteration 40, loss = 0.0016
Iteration 60, loss = 0.0036
Iteration 80, loss = 0.0043
--- Epoch 1300 / 1506 - 2794 epochs total
Iteration 0, loss = 0.0055
Iteration 20, loss = 0.0058
Iteration 40, loss = 0.0044
Iteration 60, loss = 0.0022
Iteration 80, loss = 0.0039
--- Epoch 1301 / 1506 - 2795 epochs total
Iteration 0, loss = 0.0059
Iteration 20, loss = 0.0023
Iteration 40, loss = 0.0059
Iteration 60, loss = 0.0028
Iteration 80, loss = 0.0030
--- Epoch 1302 / 1506 - 2796 epochs total
Iteration 0, loss = 0.0057
Iteration 20, loss = 0.0090
Iteration 40, loss = 0.0045
Iteration 60, loss = 0.0131
Iteration 80, loss = 0.0034
--- Epoch 1303 / 1506 - 2797 epochs total
Iteration 0, loss = 0.0030
Iteration 20, loss = 0.0070
Iteration 40, loss = 0.0222
Iteration 60, loss = 0.0092
Iteration 80, loss = 0.0063
--- Epoch 1304 / 1506 - 2798 epochs total
Iteration 0, loss = 0.0022
Iteration 20, loss = 0.0049
Iteration 40, loss = 0.0014
Iteration 60, loss = 0.0070
Iteration 80, loss = 0.0073
--- Epoch 1305 / 1506 - 2799 epochs total
Iteration 0, loss = 0.0030
Iteration 20, loss = 0.0184
Iteration 40, loss = 0.0038
Iteration 60, loss = 0.0018
Iteration 80, loss = 0.0025
--- Epoch 1306 / 1506 - 2800 epochs total
Iteration 0, loss = 0.0032
Iteration 20, loss = 0.0034
Iteration 40, loss = 0.0151
Iteration 60, loss = 0.0035
Iteration 80, loss = 0.0053
--- Epoch 1307 / 1506 - 2801 epochs total
Iteration 0, loss = 0.0065
Iteration 20, loss = 0.0020
Iteration 40, loss = 0.0028
Iteration 60, loss = 0.0032
Iteration 80, loss = 0.0056
--- Epoch 1308 / 1506 - 2802 epochs total
Iteration 0, loss = 0.0059
Iteration 20, loss = 0.0038
Iteration 40, loss = 0.0056
Iteration 60, loss = 0.0017
Iteration 80, loss = 0.0031
--- Epoch 1309 / 1506 - 2803 epochs total
Iteration 0, loss = 0.0026
Iteration 20, loss = 0.0062
Iteration 40, loss = 0.0030
Iteration 60, loss = 0.0058
Iteration 80, loss = 0.0050
--- Epoch 1310 / 1506 - 2804 epochs total
Iteration 0, loss = 0.0030
Iteration 20, loss = 0.0023
Iteration 40, loss = 0.0023
Iteration 60, loss = 0.0079
Iteration 80, loss = 0.0018
--- Epoch 1311 / 1506 - 2805 epochs total
Iteration 0, loss = 0.0029
Iteration 20, loss = 0.0030
Iteration 40, loss = 0.0042
Iteration 60, loss = 0.0082
Iteration 80, loss = 0.0035
--- Epoch 1312 / 1506 - 2806 epochs total
Iteration 0, loss = 0.0049
Iteration 20, loss = 0.0023
Iteration 40, loss = 0.0055
Iteration 60, loss = 0.0043
Iteration 80, loss = 0.0059
--- Epoch 1313 / 1506 - 2807 epochs total
Iteration 0, loss = 0.0067
Iteration 20, loss = 0.0049
Iteration 40, loss = 0.0033
Iteration 60, loss = 0.0057
Iteration 80, loss = 0.0017
--- Epoch 1314 / 1506 - 2808 epochs total
Iteration 0, loss = 0.0034
Iteration 20, loss = 0.0041
Iteration 40, loss = 0.0030
Iteration 60, loss = 0.0072
Iteration 80, loss = 0.0011
--- Epoch 1315 / 1506 - 2809 epochs total
Iteration 0, loss = 0.0043
Iteration 20, loss = 0.0026
Iteration 40, loss = 0.0022
Iteration 60, loss = 0.0110
Iteration 80, loss = 0.0037
--- Epoch 1316 / 1506 - 2810 epochs total
Iteration 0, loss = 0.0029
Iteration 20, loss = 0.0033
Iteration 40, loss = 0.0053
Iteration 60, loss = 0.0041
Iteration 80, loss = 0.0028
--- Epoch 1317 / 1506 - 2811 epochs total
Iteration 0, loss = 0.0065
Iteration 20, loss = 0.0079
Iteration 40, loss = 0.0023
Iteration 60, loss = 0.0026
Iteration 80, loss = 0.0037
--- Epoch 1318 / 1506 - 2812 epochs total
Iteration 0, loss = 0.0061
Iteration 20, loss = 0.0058
Iteration 40, loss = 0.0073
Iteration 60, loss = 0.0021
Iteration 80, loss = 0.0025
--- Epoch 1319 / 1506 - 2813 epochs total
Iteration 0, loss = 0.0014
Iteration 20, loss = 0.0040
Iteration 40, loss = 0.0028
Iteration 60, loss = 0.0037
Iteration 80, loss = 0.0026
--- Epoch 1320 / 1506 - 2814 epochs total
Iteration 0, loss = 0.0033
Iteration 20, loss = 0.0048
Iteration 40, loss = 0.0056
Iteration 60, loss = 0.0025
Iteration 80, loss = 0.0074
--- Epoch 1321 / 1506 - 2815 epochs total
Iteration 0, loss = 0.0025
Iteration 20, loss = 0.0020
Iteration 40, loss = 0.0065
Iteration 60, loss = 0.0029
Iteration 80, loss = 0.0027
--- Epoch 1322 / 1506 - 2816 epochs total
Iteration 0, loss = 0.0081
Iteration 20, loss = 0.0030
Iteration 40, loss = 0.0032
Iteration 60, loss = 0.0041
Iteration 80, loss = 0.0058
--- Epoch 1323 / 1506 - 2817 epochs total
Iteration 0, loss = 0.0124
Iteration 20, loss = 0.0080
Iteration 40, loss = 0.0057
Iteration 60, loss = 0.0037
Iteration 80, loss = 0.0027
--- Epoch 1324 / 1506 - 2818 epochs total
Iteration 0, loss = 0.0065
Iteration 20, loss = 0.0063
Iteration 40, loss = 0.0043
Iteration 60, loss = 0.0031
Iteration 80, loss = 0.0041
--- Epoch 1325 / 1506 - 2819 epochs total
Iteration 0, loss = 0.0033
Iteration 20, loss = 0.0070
Iteration 40, loss = 0.0042
Iteration 60, loss = 0.0019
Iteration 80, loss = 0.0065
--- Epoch 1326 / 1506 - 2820 epochs total
Iteration 0, loss = 0.0073
Iteration 20, loss = 0.0055
Iteration 40, loss = 0.0020
Iteration 60, loss = 0.0029
Iteration 80, loss = 0.0039
--- Epoch 1327 / 1506 - 2821 epochs total
Iteration 0, loss = 0.0057
Iteration 20, loss = 0.0019
Iteration 40, loss = 0.0018
Iteration 60, loss = 0.0079
Iteration 80, loss = 0.0044
--- Epoch 1328 / 1506 - 2822 epochs total
Iteration 0, loss = 0.0029
Iteration 20, loss = 0.0028
Iteration 40, loss = 0.0069
Iteration 60, loss = 0.0114
Iteration 80, loss = 0.0022
--- Epoch 1329 / 1506 - 2823 epochs total
Iteration 0, loss = 0.0016
Iteration 20, loss = 0.0045
Iteration 40, loss = 0.0079
Iteration 60, loss = 0.0020
Iteration 80, loss = 0.0065
--- Epoch 1330 / 1506 - 2824 epochs total
Iteration 0, loss = 0.0027
Iteration 20, loss = 0.0028
Iteration 40, loss = 0.0041
Iteration 60, loss = 0.0024
Iteration 80, loss = 0.0086
--- Epoch 1331 / 1506 - 2825 epochs total
Iteration 0, loss = 0.0031
Iteration 20, loss = 0.0035
Iteration 40, loss = 0.0028
Iteration 60, loss = 0.0014
Iteration 80, loss = 0.0138
--- Epoch 1332 / 1506 - 2826 epochs total
Iteration 0, loss = 0.0045
Iteration 20, loss = 0.0024
Iteration 40, loss = 0.0038
Iteration 60, loss = 0.0068
Iteration 80, loss = 0.0033
--- Epoch 1333 / 1506 - 2827 epochs total
Iteration 0, loss = 0.0040
Iteration 20, loss = 0.0044
Iteration 40, loss = 0.0055
Iteration 60, loss = 0.0041
Iteration 80, loss = 0.0042
--- Epoch 1334 / 1506 - 2828 epochs total
Iteration 0, loss = 0.0035
Iteration 20, loss = 0.0053
Iteration 40, loss = 0.0130
Iteration 60, loss = 0.0033
Iteration 80, loss = 0.0089
--- Epoch 1335 / 1506 - 2829 epochs total
Iteration 0, loss = 0.0033
Iteration 20, loss = 0.0038
Iteration 40, loss = 0.0056
Iteration 60, loss = 0.0044
Iteration 80, loss = 0.0226
--- Epoch 1336 / 1506 - 2830 epochs total
Iteration 0, loss = 0.0026
Iteration 20, loss = 0.0073
Iteration 40, loss = 0.0049
Iteration 60, loss = 0.0013
Iteration 80, loss = 0.0060
--- Epoch 1337 / 1506 - 2831 epochs total
Iteration 0, loss = 0.0028
Iteration 20, loss = 0.0060
Iteration 40, loss = 0.0033
Iteration 60, loss = 0.0045
Iteration 80, loss = 0.0035
--- Epoch 1338 / 1506 - 2832 epochs total
Iteration 0, loss = 0.0027
Iteration 20, loss = 0.0039
Iteration 40, loss = 0.0054
Iteration 60, loss = 0.0030
Iteration 80, loss = 0.0035
--- Epoch 1339 / 1506 - 2833 epochs total
Iteration 0, loss = 0.0021
Iteration 20, loss = 0.0039
Iteration 40, loss = 0.0036
Iteration 60, loss = 0.0061
Iteration 80, loss = 0.0017
--- Epoch 1340 / 1506 - 2834 epochs total
Iteration 0, loss = 0.0019
Iteration 20, loss = 0.0054
Iteration 40, loss = 0.0039
Iteration 60, loss = 0.0032
Iteration 80, loss = 0.0045
--- Epoch 1341 / 1506 - 2835 epochs total
Iteration 0, loss = 0.0078
Iteration 20, loss = 0.0039
Iteration 40, loss = 0.0037
Iteration 60, loss = 0.0049
Iteration 80, loss = 0.0095
--- Epoch 1342 / 1506 - 2836 epochs total
Iteration 0, loss = 0.0035
Iteration 20, loss = 0.0016
Iteration 40, loss = 0.0060
Iteration 60, loss = 0.0038
Iteration 80, loss = 0.0022
--- Epoch 1343 / 1506 - 2837 epochs total
Iteration 0, loss = 0.0014
Iteration 20, loss = 0.0051
Iteration 40, loss = 0.0039
Iteration 60, loss = 0.0032
Iteration 80, loss = 0.0042
--- Epoch 1344 / 1506 - 2838 epochs total
Iteration 0, loss = 0.0034
Iteration 20, loss = 0.0039
Iteration 40, loss = 0.0036
Iteration 60, loss = 0.0060
Iteration 80, loss = 0.0076
--- Epoch 1345 / 1506 - 2839 epochs total
Iteration 0, loss = 0.0069
Iteration 20, loss = 0.0031
Iteration 40, loss = 0.0024
Iteration 60, loss = 0.0028
Iteration 80, loss = 0.0036
--- Epoch 1346 / 1506 - 2840 epochs total
Iteration 0, loss = 0.0040
Iteration 20, loss = 0.0062
Iteration 40, loss = 0.0073
Iteration 60, loss = 0.0035
Iteration 80, loss = 0.0032
--- Epoch 1347 / 1506 - 2841 epochs total
Iteration 0, loss = 0.0046
Iteration 20, loss = 0.0022
Iteration 40, loss = 0.0043
Iteration 60, loss = 0.0033
Iteration 80, loss = 0.0039
--- Epoch 1348 / 1506 - 2842 epochs total
Iteration 0, loss = 0.0041
Iteration 20, loss = 0.0065
Iteration 40, loss = 0.0036
Iteration 60, loss = 0.0067
Iteration 80, loss = 0.0017
--- Epoch 1349 / 1506 - 2843 epochs total
Iteration 0, loss = 0.0044
Iteration 20, loss = 0.0024
Iteration 40, loss = 0.0043
Iteration 60, loss = 0.0029
Iteration 80, loss = 0.0023
--- Epoch 1350 / 1506 - 2844 epochs total
Iteration 0, loss = 0.0030
Iteration 20, loss = 0.0032
Iteration 40, loss = 0.0024
Iteration 60, loss = 0.0028
Iteration 80, loss = 0.0021
--- Epoch 1351 / 1506 - 2845 epochs total
Iteration 0, loss = 0.0055
Iteration 20, loss = 0.0029
Iteration 40, loss = 0.0027
Iteration 60, loss = 0.0058
Iteration 80, loss = 0.0034
--- Epoch 1352 / 1506 - 2846 epochs total
Iteration 0, loss = 0.0050
Iteration 20, loss = 0.0060
Iteration 40, loss = 0.0030
Iteration 60, loss = 0.0044
Iteration 80, loss = 0.0038
--- Epoch 1353 / 1506 - 2847 epochs total
Iteration 0, loss = 0.0018
Iteration 20, loss = 0.0039
Iteration 40, loss = 0.0034
Iteration 60, loss = 0.0020
Iteration 80, loss = 0.0063
--- Epoch 1354 / 1506 - 2848 epochs total
Iteration 0, loss = 0.0092
Iteration 20, loss = 0.0014
Iteration 40, loss = 0.0026
Iteration 60, loss = 0.0033
Iteration 80, loss = 0.0036
--- Epoch 1355 / 1506 - 2849 epochs total
Iteration 0, loss = 0.0031
Iteration 20, loss = 0.0019
Iteration 40, loss = 0.0013
Iteration 60, loss = 0.0050
Iteration 80, loss = 0.0046
--- Epoch 1356 / 1506 - 2850 epochs total
Iteration 0, loss = 0.0127
Iteration 20, loss = 0.0036
Iteration 40, loss = 0.0027
Iteration 60, loss = 0.0064
Iteration 80, loss = 0.0048
--- Epoch 1357 / 1506 - 2851 epochs total
Iteration 0, loss = 0.0025
Iteration 20, loss = 0.0055
Iteration 40, loss = 0.0028
Iteration 60, loss = 0.0073
Iteration 80, loss = 0.0082
--- Epoch 1358 / 1506 - 2852 epochs total
Iteration 0, loss = 0.0044
Iteration 20, loss = 0.0043
Iteration 40, loss = 0.0025
Iteration 60, loss = 0.0041
Iteration 80, loss = 0.0065
--- Epoch 1359 / 1506 - 2853 epochs total
Iteration 0, loss = 0.0039
Iteration 20, loss = 0.0017
Iteration 40, loss = 0.0135
Iteration 60, loss = 0.0054
Iteration 80, loss = 0.0023
--- Epoch 1360 / 1506 - 2854 epochs total
Iteration 0, loss = 0.0037
Iteration 20, loss = 0.0056
Iteration 40, loss = 0.0024
Iteration 60, loss = 0.0025
Iteration 80, loss = 0.0020
--- Epoch 1361 / 1506 - 2855 epochs total
Iteration 0, loss = 0.0027
Iteration 20, loss = 0.0043
Iteration 40, loss = 0.0038
Iteration 60, loss = 0.0073
Iteration 80, loss = 0.0053
--- Epoch 1362 / 1506 - 2856 epochs total
Iteration 0, loss = 0.0079
Iteration 20, loss = 0.0060
Iteration 40, loss = 0.0016
Iteration 60, loss = 0.0044
Iteration 80, loss = 0.0028
--- Epoch 1363 / 1506 - 2857 epochs total
Iteration 0, loss = 0.0028
Iteration 20, loss = 0.0026
Iteration 40, loss = 0.0041
Iteration 60, loss = 0.0044
Iteration 80, loss = 0.0042
--- Epoch 1364 / 1506 - 2858 epochs total
Iteration 0, loss = 0.0028
Iteration 20, loss = 0.0073
Iteration 40, loss = 0.0053
Iteration 60, loss = 0.0084
Iteration 80, loss = 0.0064
--- Epoch 1365 / 1506 - 2859 epochs total
Iteration 0, loss = 0.0066
Iteration 20, loss = 0.0069
Iteration 40, loss = 0.0030
Iteration 60, loss = 0.0028
Iteration 80, loss = 0.0052
--- Epoch 1366 / 1506 - 2860 epochs total
Iteration 0, loss = 0.0014
Iteration 20, loss = 0.0038
Iteration 40, loss = 0.0039
Iteration 60, loss = 0.0054
Iteration 80, loss = 0.0043
--- Epoch 1367 / 1506 - 2861 epochs total
Iteration 0, loss = 0.0087
Iteration 20, loss = 0.0030
Iteration 40, loss = 0.0073
Iteration 60, loss = 0.0029
Iteration 80, loss = 0.0047
--- Epoch 1368 / 1506 - 2862 epochs total
Iteration 0, loss = 0.0055
Iteration 20, loss = 0.0056
Iteration 40, loss = 0.0111
Iteration 60, loss = 0.0027
Iteration 80, loss = 0.0036
--- Epoch 1369 / 1506 - 2863 epochs total
Iteration 0, loss = 0.0050
Iteration 20, loss = 0.0043
Iteration 40, loss = 0.0045
Iteration 60, loss = 0.0033
Iteration 80, loss = 0.0018
--- Epoch 1370 / 1506 - 2864 epochs total
Iteration 0, loss = 0.0035
Iteration 20, loss = 0.0073
Iteration 40, loss = 0.0024
Iteration 60, loss = 0.0059
Iteration 80, loss = 0.0136
--- Epoch 1371 / 1506 - 2865 epochs total
Iteration 0, loss = 0.0026
Iteration 20, loss = 0.0044
Iteration 40, loss = 0.0027
Iteration 60, loss = 0.0031
Iteration 80, loss = 0.0043
--- Epoch 1372 / 1506 - 2866 epochs total
Iteration 0, loss = 0.0027
Iteration 20, loss = 0.0029
Iteration 40, loss = 0.0119
Iteration 60, loss = 0.0018
Iteration 80, loss = 0.0022
--- Epoch 1373 / 1506 - 2867 epochs total
Iteration 0, loss = 0.0051
Iteration 20, loss = 0.0065
Iteration 40, loss = 0.0035
Iteration 60, loss = 0.0058
Iteration 80, loss = 0.0038
--- Epoch 1374 / 1506 - 2868 epochs total
Iteration 0, loss = 0.0101
Iteration 20, loss = 0.0161
Iteration 40, loss = 0.0051
Iteration 60, loss = 0.0058
Iteration 80, loss = 0.0032
--- Epoch 1375 / 1506 - 2869 epochs total
Iteration 0, loss = 0.0037
Iteration 20, loss = 0.0055
Iteration 40, loss = 0.0022
Iteration 60, loss = 0.0032
Iteration 80, loss = 0.0027
--- Epoch 1376 / 1506 - 2870 epochs total
Iteration 0, loss = 0.0046
Iteration 20, loss = 0.0112
Iteration 40, loss = 0.0067
Iteration 60, loss = 0.0041
Iteration 80, loss = 0.0030
--- Epoch 1377 / 1506 - 2871 epochs total
Iteration 0, loss = 0.0028
Iteration 20, loss = 0.0036
Iteration 40, loss = 0.0045
Iteration 60, loss = 0.0039
Iteration 80, loss = 0.0039
--- Epoch 1378 / 1506 - 2872 epochs total
Iteration 0, loss = 0.0082
Iteration 20, loss = 0.0024
Iteration 40, loss = 0.0019
Iteration 60, loss = 0.0044
Iteration 80, loss = 0.0034
--- Epoch 1379 / 1506 - 2873 epochs total
Iteration 0, loss = 0.0063
Iteration 20, loss = 0.0036
Iteration 40, loss = 0.0023
Iteration 60, loss = 0.0073
Iteration 80, loss = 0.0397
--- Epoch 1380 / 1506 - 2874 epochs total
Iteration 0, loss = 0.0052
Iteration 20, loss = 0.0033
Iteration 40, loss = 0.0021
Iteration 60, loss = 0.0029
Iteration 80, loss = 0.0044
--- Epoch 1381 / 1506 - 2875 epochs total
Iteration 0, loss = 0.0021
Iteration 20, loss = 0.0044
Iteration 40, loss = 0.0084
Iteration 60, loss = 0.0053
Iteration 80, loss = 0.0035
--- Epoch 1382 / 1506 - 2876 epochs total
Iteration 0, loss = 0.0029
Iteration 20, loss = 0.0028
Iteration 40, loss = 0.0029
Iteration 60, loss = 0.0025
Iteration 80, loss = 0.0223
--- Epoch 1383 / 1506 - 2877 epochs total
Iteration 0, loss = 0.0332
Iteration 20, loss = 0.0023
Iteration 40, loss = 0.0060
Iteration 60, loss = 0.0040
Iteration 80, loss = 0.0072
--- Epoch 1384 / 1506 - 2878 epochs total
Iteration 0, loss = 0.0023
Iteration 20, loss = 0.0074
Iteration 40, loss = 0.0039
Iteration 60, loss = 0.0055
Iteration 80, loss = 0.0029
--- Epoch 1385 / 1506 - 2879 epochs total
Iteration 0, loss = 0.0030
Iteration 20, loss = 0.0028
Iteration 40, loss = 0.0038
Iteration 60, loss = 0.0028
Iteration 80, loss = 0.0037
--- Epoch 1386 / 1506 - 2880 epochs total
Iteration 0, loss = 0.0044
Iteration 20, loss = 0.0026
Iteration 40, loss = 0.0082
Iteration 60, loss = 0.0028
Iteration 80, loss = 0.0054
--- Epoch 1387 / 1506 - 2881 epochs total
Iteration 0, loss = 0.0081
Iteration 20, loss = 0.0046
Iteration 40, loss = 0.0049
Iteration 60, loss = 0.0051
Iteration 80, loss = 0.0040
--- Epoch 1388 / 1506 - 2882 epochs total
Iteration 0, loss = 0.0159
Iteration 20, loss = 0.0067
Iteration 40, loss = 0.0037
Iteration 60, loss = 0.0023
Iteration 80, loss = 0.0068
--- Epoch 1389 / 1506 - 2883 epochs total
Iteration 0, loss = 0.0042
Iteration 20, loss = 0.0069
Iteration 40, loss = 0.0040
Iteration 60, loss = 0.0033
Iteration 80, loss = 0.0036
--- Epoch 1390 / 1506 - 2884 epochs total
Iteration 0, loss = 0.0030
Iteration 20, loss = 0.0050
Iteration 40, loss = 0.0091
Iteration 60, loss = 0.0038
Iteration 80, loss = 0.0170
--- Epoch 1391 / 1506 - 2885 epochs total
Iteration 0, loss = 0.0019
Iteration 20, loss = 0.0150
Iteration 40, loss = 0.0036
Iteration 60, loss = 0.0046
Iteration 80, loss = 0.0022
--- Epoch 1392 / 1506 - 2886 epochs total
Iteration 0, loss = 0.0023
Iteration 20, loss = 0.0040
Iteration 40, loss = 0.0047
Iteration 60, loss = 0.0058
Iteration 80, loss = 0.0041
--- Epoch 1393 / 1506 - 2887 epochs total
Iteration 0, loss = 0.0043
Iteration 20, loss = 0.0059
Iteration 40, loss = 0.0061
Iteration 60, loss = 0.0021
Iteration 80, loss = 0.0022
--- Epoch 1394 / 1506 - 2888 epochs total
Iteration 0, loss = 0.0017
Iteration 20, loss = 0.0028
Iteration 40, loss = 0.0049
Iteration 60, loss = 0.0039
Iteration 80, loss = 0.0033
--- Epoch 1395 / 1506 - 2889 epochs total
Iteration 0, loss = 0.0066
Iteration 20, loss = 0.0041
Iteration 40, loss = 0.0051
Iteration 60, loss = 0.0016
Iteration 80, loss = 0.0040
--- Epoch 1396 / 1506 - 2890 epochs total
Iteration 0, loss = 0.0043
Iteration 20, loss = 0.0033
Iteration 40, loss = 0.0029
Iteration 60, loss = 0.0040
Iteration 80, loss = 0.0097
--- Epoch 1397 / 1506 - 2891 epochs total
Iteration 0, loss = 0.0018
Iteration 20, loss = 0.0027
Iteration 40, loss = 0.0043
Iteration 60, loss = 0.0047
Iteration 80, loss = 0.0022
--- Epoch 1398 / 1506 - 2892 epochs total
Iteration 0, loss = 0.0038
Iteration 20, loss = 0.0029
Iteration 40, loss = 0.0019
Iteration 60, loss = 0.0087
Iteration 80, loss = 0.0039
--- Epoch 1399 / 1506 - 2893 epochs total
Iteration 0, loss = 0.0032
Iteration 20, loss = 0.0026
Iteration 40, loss = 0.0026
Iteration 60, loss = 0.0080
Iteration 80, loss = 0.0055
--- Epoch 1400 / 1506 - 2894 epochs total
Iteration 0, loss = 0.0016
Iteration 20, loss = 0.0027
Iteration 40, loss = 0.0020
Iteration 60, loss = 0.0040
Iteration 80, loss = 0.0037
--- Epoch 1401 / 1506 - 2895 epochs total
Iteration 0, loss = 0.0061
Iteration 20, loss = 0.0013
Iteration 40, loss = 0.0034
Iteration 60, loss = 0.0078
Iteration 80, loss = 0.0042
--- Epoch 1402 / 1506 - 2896 epochs total
Iteration 0, loss = 0.0041
Iteration 20, loss = 0.0023
Iteration 40, loss = 0.0031
Iteration 60, loss = 0.0032
Iteration 80, loss = 0.0147
--- Epoch 1403 / 1506 - 2897 epochs total
Iteration 0, loss = 0.0027
Iteration 20, loss = 0.0037
Iteration 40, loss = 0.0065
Iteration 60, loss = 0.0106
Iteration 80, loss = 0.0042
--- Epoch 1404 / 1506 - 2898 epochs total
Iteration 0, loss = 0.0093
Iteration 20, loss = 0.0024
Iteration 40, loss = 0.0059
Iteration 60, loss = 0.0019
Iteration 80, loss = 0.0028
--- Epoch 1405 / 1506 - 2899 epochs total
Iteration 0, loss = 0.0021
Iteration 20, loss = 0.0036
Iteration 40, loss = 0.0028
Iteration 60, loss = 0.0070
Iteration 80, loss = 0.0026
--- Epoch 1406 / 1506 - 2900 epochs total
Iteration 0, loss = 0.0020
Iteration 20, loss = 0.0062
Iteration 40, loss = 0.0029
Iteration 60, loss = 0.0032
Iteration 80, loss = 0.0125
--- Epoch 1407 / 1506 - 2901 epochs total
Iteration 0, loss = 0.0056
Iteration 20, loss = 0.0020
Iteration 40, loss = 0.0047
Iteration 60, loss = 0.0033
Iteration 80, loss = 0.0193
--- Epoch 1408 / 1506 - 2902 epochs total
Iteration 0, loss = 0.0072
Iteration 20, loss = 0.0023
Iteration 40, loss = 0.0020
Iteration 60, loss = 0.0032
Iteration 80, loss = 0.0054
--- Epoch 1409 / 1506 - 2903 epochs total
Iteration 0, loss = 0.0027
Iteration 20, loss = 0.0026
Iteration 40, loss = 0.0033
Iteration 60, loss = 0.0035
Iteration 80, loss = 0.0035
--- Epoch 1410 / 1506 - 2904 epochs total
Iteration 0, loss = 0.0023
Iteration 20, loss = 0.0037
Iteration 40, loss = 0.0033
Iteration 60, loss = 0.0048
Iteration 80, loss = 0.0031
--- Epoch 1411 / 1506 - 2905 epochs total
Iteration 0, loss = 0.0035
Iteration 20, loss = 0.0043
Iteration 40, loss = 0.0017
Iteration 60, loss = 0.0033
Iteration 80, loss = 0.0043
--- Epoch 1412 / 1506 - 2906 epochs total
Iteration 0, loss = 0.0407
Iteration 20, loss = 0.0024
Iteration 40, loss = 0.0052
Iteration 60, loss = 0.0066
Iteration 80, loss = 0.0036
--- Epoch 1413 / 1506 - 2907 epochs total
Iteration 0, loss = 0.0016
Iteration 20, loss = 0.0060
Iteration 40, loss = 0.0056
Iteration 60, loss = 0.0036
Iteration 80, loss = 0.0047
--- Epoch 1414 / 1506 - 2908 epochs total
Iteration 0, loss = 0.0020
Iteration 20, loss = 0.0024
Iteration 40, loss = 0.0148
Iteration 60, loss = 0.0028
Iteration 80, loss = 0.0028
--- Epoch 1415 / 1506 - 2909 epochs total
Iteration 0, loss = 0.0029
Iteration 20, loss = 0.0040
Iteration 40, loss = 0.0058
Iteration 60, loss = 0.0043
Iteration 80, loss = 0.0031
--- Epoch 1416 / 1506 - 2910 epochs total
Iteration 0, loss = 0.0119
Iteration 20, loss = 0.0018
Iteration 40, loss = 0.0021
Iteration 60, loss = 0.0292
Iteration 80, loss = 0.0050
--- Epoch 1417 / 1506 - 2911 epochs total
Iteration 0, loss = 0.0019
Iteration 20, loss = 0.0134
Iteration 40, loss = 0.0043
Iteration 60, loss = 0.0038
Iteration 80, loss = 0.0049
--- Epoch 1418 / 1506 - 2912 epochs total
Iteration 0, loss = 0.0081
Iteration 20, loss = 0.0044
Iteration 40, loss = 0.0063
Iteration 60, loss = 0.0113
Iteration 80, loss = 0.0055
--- Epoch 1419 / 1506 - 2913 epochs total
Iteration 0, loss = 0.0099
Iteration 20, loss = 0.0026
Iteration 40, loss = 0.0025
Iteration 60, loss = 0.0044
Iteration 80, loss = 0.0026
--- Epoch 1420 / 1506 - 2914 epochs total
Iteration 0, loss = 0.0073
Iteration 20, loss = 0.0043
Iteration 40, loss = 0.0200
Iteration 60, loss = 0.0043
Iteration 80, loss = 0.0096
--- Epoch 1421 / 1506 - 2915 epochs total
Iteration 0, loss = 0.0035
Iteration 20, loss = 0.0024
Iteration 40, loss = 0.0014
Iteration 60, loss = 0.0025
Iteration 80, loss = 0.0025
--- Epoch 1422 / 1506 - 2916 epochs total
Iteration 0, loss = 0.0051
Iteration 20, loss = 0.0028
Iteration 40, loss = 0.0039
Iteration 60, loss = 0.0043
Iteration 80, loss = 0.0027
--- Epoch 1423 / 1506 - 2917 epochs total
Iteration 0, loss = 0.0060
Iteration 20, loss = 0.0079
Iteration 40, loss = 0.0067
Iteration 60, loss = 0.0014
Iteration 80, loss = 0.0024
--- Epoch 1424 / 1506 - 2918 epochs total
Iteration 0, loss = 0.0111
Iteration 20, loss = 0.0061
Iteration 40, loss = 0.0054
Iteration 60, loss = 0.0054
Iteration 80, loss = 0.0025
--- Epoch 1425 / 1506 - 2919 epochs total
Iteration 0, loss = 0.0012
Iteration 20, loss = 0.0141
Iteration 40, loss = 0.0124
Iteration 60, loss = 0.0036
Iteration 80, loss = 0.0083
--- Epoch 1426 / 1506 - 2920 epochs total
Iteration 0, loss = 0.0044
Iteration 20, loss = 0.0123
Iteration 40, loss = 0.0036
Iteration 60, loss = 0.0036
Iteration 80, loss = 0.0058
--- Epoch 1427 / 1506 - 2921 epochs total
Iteration 0, loss = 0.0034
Iteration 20, loss = 0.0038
Iteration 40, loss = 0.0043
Iteration 60, loss = 0.0037
Iteration 80, loss = 0.0034
--- Epoch 1428 / 1506 - 2922 epochs total
Iteration 0, loss = 0.0109
Iteration 20, loss = 0.0072
Iteration 40, loss = 0.0028
Iteration 60, loss = 0.0039
Iteration 80, loss = 0.0052
--- Epoch 1429 / 1506 - 2923 epochs total
Iteration 0, loss = 0.0046
Iteration 20, loss = 0.0119
Iteration 40, loss = 0.0014
Iteration 60, loss = 0.0019
Iteration 80, loss = 0.0088
--- Epoch 1430 / 1506 - 2924 epochs total
Iteration 0, loss = 0.0044
Iteration 20, loss = 0.0020
Iteration 40, loss = 0.0043
Iteration 60, loss = 0.0027
Iteration 80, loss = 0.0044
--- Epoch 1431 / 1506 - 2925 epochs total
Iteration 0, loss = 0.0119
Iteration 20, loss = 0.0097
Iteration 40, loss = 0.0031
Iteration 60, loss = 0.0041
Iteration 80, loss = 0.0053
--- Epoch 1432 / 1506 - 2926 epochs total
Iteration 0, loss = 0.0028
Iteration 20, loss = 0.0028
Iteration 40, loss = 0.0027
Iteration 60, loss = 0.0025
Iteration 80, loss = 0.0022
--- Epoch 1433 / 1506 - 2927 epochs total
Iteration 0, loss = 0.0020
Iteration 20, loss = 0.0068
Iteration 40, loss = 0.0030
Iteration 60, loss = 0.0020
Iteration 80, loss = 0.0013
--- Epoch 1434 / 1506 - 2928 epochs total
Iteration 0, loss = 0.0029
Iteration 20, loss = 0.0033
Iteration 40, loss = 0.0026
Iteration 60, loss = 0.0032
Iteration 80, loss = 0.0039
--- Epoch 1435 / 1506 - 2929 epochs total
Iteration 0, loss = 0.0022
Iteration 20, loss = 0.0099
Iteration 40, loss = 0.0035
Iteration 60, loss = 0.0046
Iteration 80, loss = 0.0059
--- Epoch 1436 / 1506 - 2930 epochs total
Iteration 0, loss = 0.0024
Iteration 20, loss = 0.0027
Iteration 40, loss = 0.0073
Iteration 60, loss = 0.0024
Iteration 80, loss = 0.0153
--- Epoch 1437 / 1506 - 2931 epochs total
Iteration 0, loss = 0.0037
Iteration 20, loss = 0.0026
Iteration 40, loss = 0.0051
Iteration 60, loss = 0.0017
Iteration 80, loss = 0.0048
--- Epoch 1438 / 1506 - 2932 epochs total
Iteration 0, loss = 0.0060
Iteration 20, loss = 0.0035
Iteration 40, loss = 0.0023
Iteration 60, loss = 0.0034
Iteration 80, loss = 0.0017
--- Epoch 1439 / 1506 - 2933 epochs total
Iteration 0, loss = 0.0095
Iteration 20, loss = 0.0029
Iteration 40, loss = 0.0052
Iteration 60, loss = 0.0019
Iteration 80, loss = 0.0022
--- Epoch 1440 / 1506 - 2934 epochs total
Iteration 0, loss = 0.0039
Iteration 20, loss = 0.0022
Iteration 40, loss = 0.0058
Iteration 60, loss = 0.0027
Iteration 80, loss = 0.0023
--- Epoch 1441 / 1506 - 2935 epochs total
Iteration 0, loss = 0.0047
Iteration 20, loss = 0.0035
Iteration 40, loss = 0.0029
Iteration 60, loss = 0.0054
Iteration 80, loss = 0.0036
--- Epoch 1442 / 1506 - 2936 epochs total
Iteration 0, loss = 0.0025
Iteration 20, loss = 0.0035
Iteration 40, loss = 0.0039
Iteration 60, loss = 0.0031
Iteration 80, loss = 0.0026
--- Epoch 1443 / 1506 - 2937 epochs total
Iteration 0, loss = 0.0020
Iteration 20, loss = 0.0030
Iteration 40, loss = 0.0032
Iteration 60, loss = 0.0098
Iteration 80, loss = 0.0026
--- Epoch 1444 / 1506 - 2938 epochs total
Iteration 0, loss = 0.0027
Iteration 20, loss = 0.0022
Iteration 40, loss = 0.0028
Iteration 60, loss = 0.0030
Iteration 80, loss = 0.0059
--- Epoch 1445 / 1506 - 2939 epochs total
Iteration 0, loss = 0.0040
Iteration 20, loss = 0.0081
Iteration 40, loss = 0.0018
Iteration 60, loss = 0.0016
Iteration 80, loss = 0.0032
--- Epoch 1446 / 1506 - 2940 epochs total
Iteration 0, loss = 0.0017
Iteration 20, loss = 0.0043
Iteration 40, loss = 0.0020
Iteration 60, loss = 0.0025
Iteration 80, loss = 0.0067
--- Epoch 1447 / 1506 - 2941 epochs total
Iteration 0, loss = 0.0048
Iteration 20, loss = 0.0086
Iteration 40, loss = 0.0029
Iteration 60, loss = 0.0018
Iteration 80, loss = 0.0050
--- Epoch 1448 / 1506 - 2942 epochs total
Iteration 0, loss = 0.0031
Iteration 20, loss = 0.0037
Iteration 40, loss = 0.0022
Iteration 60, loss = 0.0054
Iteration 80, loss = 0.0033
--- Epoch 1449 / 1506 - 2943 epochs total
Iteration 0, loss = 0.0028
Iteration 20, loss = 0.0061
Iteration 40, loss = 0.0030
Iteration 60, loss = 0.0060
Iteration 80, loss = 0.0098
--- Epoch 1450 / 1506 - 2944 epochs total
Iteration 0, loss = 0.0106
Iteration 20, loss = 0.0029
Iteration 40, loss = 0.0026
Iteration 60, loss = 0.0110
Iteration 80, loss = 0.0022
--- Epoch 1451 / 1506 - 2945 epochs total
Iteration 0, loss = 0.0077
Iteration 20, loss = 0.0026
Iteration 40, loss = 0.0059
Iteration 60, loss = 0.0032
Iteration 80, loss = 0.0017
--- Epoch 1452 / 1506 - 2946 epochs total
Iteration 0, loss = 0.0031
Iteration 20, loss = 0.0046
Iteration 40, loss = 0.0046
Iteration 60, loss = 0.0028
Iteration 80, loss = 0.0029
--- Epoch 1453 / 1506 - 2947 epochs total
Iteration 0, loss = 0.0075
Iteration 20, loss = 0.0044
Iteration 40, loss = 0.0015
Iteration 60, loss = 0.0039
Iteration 80, loss = 0.0097
--- Epoch 1454 / 1506 - 2948 epochs total
Iteration 0, loss = 0.0024
Iteration 20, loss = 0.0025
Iteration 40, loss = 0.0065
Iteration 60, loss = 0.0062
Iteration 80, loss = 0.0027
--- Epoch 1455 / 1506 - 2949 epochs total
Iteration 0, loss = 0.0055
Iteration 20, loss = 0.0029
Iteration 40, loss = 0.0037
Iteration 60, loss = 0.0033
Iteration 80, loss = 0.0030
--- Epoch 1456 / 1506 - 2950 epochs total
Iteration 0, loss = 0.0027
Iteration 20, loss = 0.0026
Iteration 40, loss = 0.0050
Iteration 60, loss = 0.0071
Iteration 80, loss = 0.0020
--- Epoch 1457 / 1506 - 2951 epochs total
Iteration 0, loss = 0.0023
Iteration 20, loss = 0.0019
Iteration 40, loss = 0.0056
Iteration 60, loss = 0.0033
Iteration 80, loss = 0.0046
--- Epoch 1458 / 1506 - 2952 epochs total
Iteration 0, loss = 0.0049
Iteration 20, loss = 0.0099
Iteration 40, loss = 0.0027
Iteration 60, loss = 0.0035
Iteration 80, loss = 0.0018
--- Epoch 1459 / 1506 - 2953 epochs total
Iteration 0, loss = 0.0060
Iteration 20, loss = 0.0060
Iteration 40, loss = 0.0028
Iteration 60, loss = 0.0057
Iteration 80, loss = 0.0070
--- Epoch 1460 / 1506 - 2954 epochs total
Iteration 0, loss = 0.0069
Iteration 20, loss = 0.0031
Iteration 40, loss = 0.0021
Iteration 60, loss = 0.0049
Iteration 80, loss = 0.0023
--- Epoch 1461 / 1506 - 2955 epochs total
Iteration 0, loss = 0.0068
Iteration 20, loss = 0.0038
Iteration 40, loss = 0.0139
Iteration 60, loss = 0.0052
Iteration 80, loss = 0.0281
--- Epoch 1462 / 1506 - 2956 epochs total
Iteration 0, loss = 0.0033
Iteration 20, loss = 0.0016
Iteration 40, loss = 0.0060
Iteration 60, loss = 0.0032
Iteration 80, loss = 0.0088
--- Epoch 1463 / 1506 - 2957 epochs total
Iteration 0, loss = 0.0048
Iteration 20, loss = 0.0018
Iteration 40, loss = 0.0138
Iteration 60, loss = 0.0022
Iteration 80, loss = 0.0048
--- Epoch 1464 / 1506 - 2958 epochs total
Iteration 0, loss = 0.0049
Iteration 20, loss = 0.0034
Iteration 40, loss = 0.0019
Iteration 60, loss = 0.0080
Iteration 80, loss = 0.0025
--- Epoch 1465 / 1506 - 2959 epochs total
Iteration 0, loss = 0.0024
Iteration 20, loss = 0.0039
Iteration 40, loss = 0.0027
Iteration 60, loss = 0.0023
Iteration 80, loss = 0.0031
--- Epoch 1466 / 1506 - 2960 epochs total
Iteration 0, loss = 0.0029
Iteration 20, loss = 0.0061
Iteration 40, loss = 0.0020
Iteration 60, loss = 0.0072
Iteration 80, loss = 0.0028
--- Epoch 1467 / 1506 - 2961 epochs total
Iteration 0, loss = 0.0039
Iteration 20, loss = 0.0055
Iteration 40, loss = 0.0039
Iteration 60, loss = 0.0046
Iteration 80, loss = 0.0025
--- Epoch 1468 / 1506 - 2962 epochs total
Iteration 0, loss = 0.0069
Iteration 20, loss = 0.0031
Iteration 40, loss = 0.0025
Iteration 60, loss = 0.0032
Iteration 80, loss = 0.0087
--- Epoch 1469 / 1506 - 2963 epochs total
Iteration 0, loss = 0.0023
Iteration 20, loss = 0.0068
Iteration 40, loss = 0.0038
Iteration 60, loss = 0.0022
Iteration 80, loss = 0.0036
--- Epoch 1470 / 1506 - 2964 epochs total
Iteration 0, loss = 0.0033
Iteration 20, loss = 0.0051
Iteration 40, loss = 0.0019
Iteration 60, loss = 0.0046
Iteration 80, loss = 0.0064
--- Epoch 1471 / 1506 - 2965 epochs total
Iteration 0, loss = 0.0019
Iteration 20, loss = 0.0064
Iteration 40, loss = 0.0067
Iteration 60, loss = 0.0041
Iteration 80, loss = 0.0030
--- Epoch 1472 / 1506 - 2966 epochs total
Iteration 0, loss = 0.0079
Iteration 20, loss = 0.0029
Iteration 40, loss = 0.0011
Iteration 60, loss = 0.0042
Iteration 80, loss = 0.0070
--- Epoch 1473 / 1506 - 2967 epochs total
Iteration 0, loss = 0.0041
Iteration 20, loss = 0.0011
Iteration 40, loss = 0.0092
Iteration 60, loss = 0.0051
Iteration 80, loss = 0.0023
--- Epoch 1474 / 1506 - 2968 epochs total
Iteration 0, loss = 0.0051
Iteration 20, loss = 0.0016
Iteration 40, loss = 0.0048
Iteration 60, loss = 0.0035
Iteration 80, loss = 0.0035
--- Epoch 1475 / 1506 - 2969 epochs total
Iteration 0, loss = 0.0053
Iteration 20, loss = 0.0081
Iteration 40, loss = 0.0045
Iteration 60, loss = 0.0025
Iteration 80, loss = 0.0026
--- Epoch 1476 / 1506 - 2970 epochs total
Iteration 0, loss = 0.0040
Iteration 20, loss = 0.0280
Iteration 40, loss = 0.0067
Iteration 60, loss = 0.0026
Iteration 80, loss = 0.0076
--- Epoch 1477 / 1506 - 2971 epochs total
Iteration 0, loss = 0.0019
Iteration 20, loss = 0.0022
Iteration 40, loss = 0.0062
Iteration 60, loss = 0.0036
Iteration 80, loss = 0.0040
--- Epoch 1478 / 1506 - 2972 epochs total
Iteration 0, loss = 0.0036
Iteration 20, loss = 0.0035
Iteration 40, loss = 0.0021
Iteration 60, loss = 0.0029
Iteration 80, loss = 0.0037
--- Epoch 1479 / 1506 - 2973 epochs total
Iteration 0, loss = 0.0041
Iteration 20, loss = 0.0035
Iteration 40, loss = 0.0042
Iteration 60, loss = 0.0056
Iteration 80, loss = 0.0015
--- Epoch 1480 / 1506 - 2974 epochs total
Iteration 0, loss = 0.0033
Iteration 20, loss = 0.0024
Iteration 40, loss = 0.0053
Iteration 60, loss = 0.0016
Iteration 80, loss = 0.0028
--- Epoch 1481 / 1506 - 2975 epochs total
Iteration 0, loss = 0.0065
Iteration 20, loss = 0.0037
Iteration 40, loss = 0.0046
Iteration 60, loss = 0.0080
Iteration 80, loss = 0.0031
--- Epoch 1482 / 1506 - 2976 epochs total
Iteration 0, loss = 0.0038
Iteration 20, loss = 0.0023
Iteration 40, loss = 0.0028
Iteration 60, loss = 0.0060
Iteration 80, loss = 0.0020
--- Epoch 1483 / 1506 - 2977 epochs total
Iteration 0, loss = 0.0027
Iteration 20, loss = 0.0084
Iteration 40, loss = 0.0078
Iteration 60, loss = 0.0042
Iteration 80, loss = 0.0031
--- Epoch 1484 / 1506 - 2978 epochs total
Iteration 0, loss = 0.0027
Iteration 20, loss = 0.0041
Iteration 40, loss = 0.0044
Iteration 60, loss = 0.0032
Iteration 80, loss = 0.0044
--- Epoch 1485 / 1506 - 2979 epochs total
Iteration 0, loss = 0.0035
Iteration 20, loss = 0.0023
Iteration 40, loss = 0.0062
Iteration 60, loss = 0.0069
Iteration 80, loss = 0.0037
--- Epoch 1486 / 1506 - 2980 epochs total
Iteration 0, loss = 0.0040
Iteration 20, loss = 0.0022
Iteration 40, loss = 0.0044
Iteration 60, loss = 0.0037
Iteration 80, loss = 0.0033
--- Epoch 1487 / 1506 - 2981 epochs total
Iteration 0, loss = 0.0028
Iteration 20, loss = 0.0057
Iteration 40, loss = 0.0058
Iteration 60, loss = 0.0035
Iteration 80, loss = 0.0041
--- Epoch 1488 / 1506 - 2982 epochs total
Iteration 0, loss = 0.0023
Iteration 20, loss = 0.0027
Iteration 40, loss = 0.0065
Iteration 60, loss = 0.0016
Iteration 80, loss = 0.0086
--- Epoch 1489 / 1506 - 2983 epochs total
Iteration 0, loss = 0.0051
Iteration 20, loss = 0.0073
Iteration 40, loss = 0.0021
Iteration 60, loss = 0.0050
Iteration 80, loss = 0.0022
--- Epoch 1490 / 1506 - 2984 epochs total
Iteration 0, loss = 0.0049
Iteration 20, loss = 0.0038
Iteration 40, loss = 0.0036
Iteration 60, loss = 0.0044
Iteration 80, loss = 0.0045
--- Epoch 1491 / 1506 - 2985 epochs total
Iteration 0, loss = 0.0061
Iteration 20, loss = 0.0028
Iteration 40, loss = 0.0030
Iteration 60, loss = 0.0024
Iteration 80, loss = 0.0041
--- Epoch 1492 / 1506 - 2986 epochs total
Iteration 0, loss = 0.0035
Iteration 20, loss = 0.0030
Iteration 40, loss = 0.0057
Iteration 60, loss = 0.0111
Iteration 80, loss = 0.0059
--- Epoch 1493 / 1506 - 2987 epochs total
Iteration 0, loss = 0.0029
Iteration 20, loss = 0.0027
Iteration 40, loss = 0.0039
Iteration 60, loss = 0.0038
Iteration 80, loss = 0.0023
--- Epoch 1494 / 1506 - 2988 epochs total
Iteration 0, loss = 0.0055
Iteration 20, loss = 0.0032
Iteration 40, loss = 0.0047
Iteration 60, loss = 0.0023
Iteration 80, loss = 0.0058
--- Epoch 1495 / 1506 - 2989 epochs total
Iteration 0, loss = 0.0051
Iteration 20, loss = 0.0043
Iteration 40, loss = 0.0023
Iteration 60, loss = 0.0035
Iteration 80, loss = 0.0118
--- Epoch 1496 / 1506 - 2990 epochs total
Iteration 0, loss = 0.0024
Iteration 20, loss = 0.0023
Iteration 40, loss = 0.0031
Iteration 60, loss = 0.0042
Iteration 80, loss = 0.0054
--- Epoch 1497 / 1506 - 2991 epochs total
Iteration 0, loss = 0.0022
Iteration 20, loss = 0.0032
Iteration 40, loss = 0.0253
Iteration 60, loss = 0.0031
Iteration 80, loss = 0.0024
--- Epoch 1498 / 1506 - 2992 epochs total
Iteration 0, loss = 0.0032
Iteration 20, loss = 0.0046
Iteration 40, loss = 0.0023
Iteration 60, loss = 0.0027
Iteration 80, loss = 0.0047
--- Epoch 1499 / 1506 - 2993 epochs total
Iteration 0, loss = 0.0093
Iteration 20, loss = 0.0043
Iteration 40, loss = 0.0025
Iteration 60, loss = 0.0024
Iteration 80, loss = 0.0011
--- Epoch 1500 / 1506 - 2994 epochs total
Iteration 0, loss = 0.0044
Iteration 20, loss = 0.0029
Iteration 40, loss = 0.0178
Iteration 60, loss = 0.0026
Iteration 80, loss = 0.0043
--- Epoch 1501 / 1506 - 2995 epochs total
Iteration 0, loss = 0.0067
Iteration 20, loss = 0.0087
Iteration 40, loss = 0.0037
Iteration 60, loss = 0.0086
Iteration 80, loss = 0.0021
--- Epoch 1502 / 1506 - 2996 epochs total
Iteration 0, loss = 0.0027
Iteration 20, loss = 0.0534
Iteration 40, loss = 0.0040
Iteration 60, loss = 0.0018
Iteration 80, loss = 0.0100
--- Epoch 1503 / 1506 - 2997 epochs total
Iteration 0, loss = 0.0044
Iteration 20, loss = 0.0030
Iteration 40, loss = 0.0054
Iteration 60, loss = 0.0029
Iteration 80, loss = 0.0030
--- Epoch 1504 / 1506 - 2998 epochs total
Iteration 0, loss = 0.0023
Iteration 20, loss = 0.0026
Iteration 40, loss = 0.0022
Iteration 60, loss = 0.0029
Iteration 80, loss = 0.0057
--- Epoch 1505 / 1506 - 2999 epochs total
Iteration 0, loss = 0.0037
Iteration 20, loss = 0.0043
Iteration 40, loss = 0.0074
Iteration 60, loss = 0.0069
Iteration 80, loss = 0.0016
--- Epoch 1506 / 1506 - 3000 epochs total
Iteration 0, loss = 0.0050
Iteration 20, loss = 0.0024
Iteration 40, loss = 0.0040
Iteration 60, loss = 0.0074
Iteration 80, loss = 0.0061
In [168]:
# Evaluate model12 with an MSE criterion on the `X_test_horse` / `y_test_horse`
# entries of `data` (presumably the horse-class test subset built in an earlier
# cell -- confirm against where those keys are populated).
testModel(
    model12,
    x_test=data["X_test_horse"],
    y_test=data["y_test_horse"],
    criterion=nn.MSELoss(),
)
In [68]:
# Set up model13: a new ConvNet4 instance and a plain SGD optimizer over its
# parameters, using a step size of 1e-2.
# NOTE(review): this rebinds the notebook-global names `learning_rate` and
# `optimizer`; any cell run afterwards that passes `optimizer` to train() will
# get the one tied to model13 -- confirm that is intended for the other models.
learning_rate = 1e-2
model13 = ConvNet4()
optimizer = optim.SGD(model13.parameters(), lr=learning_rate)
In [135]:
# Fit model13 for 1369 epochs with an MSE criterion on the `X_train_truck` /
# `y_train_truck` entries of `data` (presumably the truck-class training subset
# -- confirm against the cell that builds those keys).
# NOTE(review): the captured log for this cell begins at "1634 epochs total",
# so train() appears to keep a cumulative epoch count and this run seems to
# have started from an already-trained model13; a fresh-kernel run may not
# reproduce the same log -- confirm.
train(
    model13,
    optimizer,
    epochs=1369,
    x_train=data["X_train_truck"],
    y_train=data["y_train_truck"],
    criterion=nn.MSELoss(),
)
--- Epoch 1 / 1369 - 1634 epochs total
Iteration 0, loss = 0.0019
Iteration 20, loss = 0.0016
Iteration 40, loss = 0.0017
Iteration 60, loss = 0.0040
Iteration 80, loss = 0.0030
--- Epoch 2 / 1369 - 1635 epochs total
Iteration 0, loss = 0.0028
Iteration 20, loss = 0.0029
Iteration 40, loss = 0.0008
Iteration 60, loss = 0.0044
Iteration 80, loss = 0.0036
--- Epoch 3 / 1369 - 1636 epochs total
Iteration 0, loss = 0.0025
Iteration 20, loss = 0.0043
Iteration 40, loss = 0.0025
Iteration 60, loss = 0.0061
Iteration 80, loss = 0.0037
--- Epoch 4 / 1369 - 1637 epochs total
Iteration 0, loss = 0.0042
Iteration 20, loss = 0.0030
Iteration 40, loss = 0.0071
Iteration 60, loss = 0.0023
Iteration 80, loss = 0.0020
--- Epoch 5 / 1369 - 1638 epochs total
Iteration 0, loss = 0.0016
Iteration 20, loss = 0.0044
Iteration 40, loss = 0.0016
Iteration 60, loss = 0.0073
Iteration 80, loss = 0.0046
--- Epoch 6 / 1369 - 1639 epochs total
Iteration 0, loss = 0.0086
Iteration 20, loss = 0.0017
Iteration 40, loss = 0.0017
Iteration 60, loss = 0.0036
Iteration 80, loss = 0.0054
--- Epoch 7 / 1369 - 1640 epochs total
Iteration 0, loss = 0.0049
Iteration 20, loss = 0.0068
Iteration 40, loss = 0.0017
Iteration 60, loss = 0.0064
Iteration 80, loss = 0.0093
--- Epoch 8 / 1369 - 1641 epochs total
Iteration 0, loss = 0.0006
Iteration 20, loss = 0.0016
Iteration 40, loss = 0.0071
Iteration 60, loss = 0.0140
Iteration 80, loss = 0.0132
--- Epoch 9 / 1369 - 1642 epochs total
Iteration 0, loss = 0.0020
Iteration 20, loss = 0.0039
Iteration 40, loss = 0.0010
Iteration 60, loss = 0.0017
Iteration 80, loss = 0.0015
--- Epoch 10 / 1369 - 1643 epochs total
Iteration 0, loss = 0.0049
Iteration 20, loss = 0.0057
Iteration 40, loss = 0.0032
Iteration 60, loss = 0.0010
Iteration 80, loss = 0.0185
--- Epoch 11 / 1369 - 1644 epochs total
Iteration 0, loss = 0.0038
Iteration 20, loss = 0.0040
Iteration 40, loss = 0.0038
Iteration 60, loss = 0.0252
Iteration 80, loss = 0.0018
--- Epoch 12 / 1369 - 1645 epochs total
Iteration 0, loss = 0.0158
Iteration 20, loss = 0.0009
Iteration 40, loss = 0.0019
Iteration 60, loss = 0.0030
Iteration 80, loss = 0.0027
--- Epoch 13 / 1369 - 1646 epochs total
Iteration 0, loss = 0.0227
Iteration 20, loss = 0.0070
Iteration 40, loss = 0.0122
Iteration 60, loss = 0.0030
Iteration 80, loss = 0.0014
--- Epoch 14 / 1369 - 1647 epochs total
Iteration 0, loss = 0.0065
Iteration 20, loss = 0.0028
Iteration 40, loss = 0.0012
Iteration 60, loss = 0.0027
Iteration 80, loss = 0.0013
--- Epoch 15 / 1369 - 1648 epochs total
Iteration 0, loss = 0.0011
Iteration 20, loss = 0.0065
Iteration 40, loss = 0.0054
Iteration 60, loss = 0.0030
Iteration 80, loss = 0.0031
--- Epoch 16 / 1369 - 1649 epochs total
Iteration 0, loss = 0.0013
Iteration 20, loss = 0.0055
Iteration 40, loss = 0.0023
Iteration 60, loss = 0.0110
Iteration 80, loss = 0.0122
--- Epoch 17 / 1369 - 1650 epochs total
Iteration 0, loss = 0.0023
Iteration 20, loss = 0.0023
Iteration 40, loss = 0.0039
Iteration 60, loss = 0.0040
Iteration 80, loss = 0.0199
--- Epoch 18 / 1369 - 1651 epochs total
Iteration 0, loss = 0.0127
Iteration 20, loss = 0.0093
Iteration 40, loss = 0.0063
Iteration 60, loss = 0.0035
Iteration 80, loss = 0.0014
--- Epoch 19 / 1369 - 1652 epochs total
Iteration 0, loss = 0.0024
Iteration 20, loss = 0.0095
Iteration 40, loss = 0.0039
Iteration 60, loss = 0.0018
Iteration 80, loss = 0.0012
--- Epoch 20 / 1369 - 1653 epochs total
Iteration 0, loss = 0.0042
Iteration 20, loss = 0.0024
Iteration 40, loss = 0.0027
Iteration 60, loss = 0.0040
Iteration 80, loss = 0.0286
--- Epoch 21 / 1369 - 1654 epochs total
Iteration 0, loss = 0.0108
Iteration 20, loss = 0.0026
Iteration 40, loss = 0.0020
Iteration 60, loss = 0.0067
Iteration 80, loss = 0.0021
--- Epoch 22 / 1369 - 1655 epochs total
Iteration 0, loss = 0.0053
Iteration 20, loss = 0.0088
Iteration 40, loss = 0.0015
Iteration 60, loss = 0.0009
Iteration 80, loss = 0.0036
--- Epoch 23 / 1369 - 1656 epochs total
Iteration 0, loss = 0.0043
Iteration 20, loss = 0.0017
Iteration 40, loss = 0.0014
Iteration 60, loss = 0.0071
Iteration 80, loss = 0.0042
--- Epoch 24 / 1369 - 1657 epochs total
Iteration 0, loss = 0.0074
Iteration 20, loss = 0.0021
Iteration 40, loss = 0.0016
Iteration 60, loss = 0.0031
Iteration 80, loss = 0.0015
--- Epoch 25 / 1369 - 1658 epochs total
Iteration 0, loss = 0.0010
Iteration 20, loss = 0.0045
Iteration 40, loss = 0.0121
Iteration 60, loss = 0.0180
Iteration 80, loss = 0.0123
--- Epoch 26 / 1369 - 1659 epochs total
Iteration 0, loss = 0.0063
Iteration 20, loss = 0.0150
Iteration 40, loss = 0.0030
Iteration 60, loss = 0.0012
Iteration 80, loss = 0.0164
--- Epoch 27 / 1369 - 1660 epochs total
Iteration 0, loss = 0.0014
Iteration 20, loss = 0.0082
Iteration 40, loss = 0.0054
Iteration 60, loss = 0.0033
Iteration 80, loss = 0.0026
--- Epoch 28 / 1369 - 1661 epochs total
Iteration 0, loss = 0.0172
Iteration 20, loss = 0.0039
Iteration 40, loss = 0.0059
Iteration 60, loss = 0.0073
Iteration 80, loss = 0.0043
--- Epoch 29 / 1369 - 1662 epochs total
Iteration 0, loss = 0.0023
Iteration 20, loss = 0.0005
Iteration 40, loss = 0.0024
Iteration 60, loss = 0.0015
Iteration 80, loss = 0.0051
--- Epoch 30 / 1369 - 1663 epochs total
Iteration 0, loss = 0.0032
Iteration 20, loss = 0.0012
Iteration 40, loss = 0.0043
Iteration 60, loss = 0.0036
Iteration 80, loss = 0.0122
--- Epoch 31 / 1369 - 1664 epochs total
Iteration 0, loss = 0.0034
Iteration 20, loss = 0.0039
Iteration 40, loss = 0.0080
Iteration 60, loss = 0.0178
Iteration 80, loss = 0.0029
--- Epoch 32 / 1369 - 1665 epochs total
Iteration 0, loss = 0.0012
Iteration 20, loss = 0.0019
Iteration 40, loss = 0.0031
Iteration 60, loss = 0.0024
Iteration 80, loss = 0.0019
--- Epoch 33 / 1369 - 1666 epochs total
Iteration 0, loss = 0.0042
Iteration 20, loss = 0.0039
Iteration 40, loss = 0.0015
Iteration 60, loss = 0.0098
Iteration 80, loss = 0.0171
--- Epoch 34 / 1369 - 1667 epochs total
Iteration 0, loss = 0.0202
Iteration 20, loss = 0.0049
Iteration 40, loss = 0.0081
Iteration 60, loss = 0.0047
Iteration 80, loss = 0.0054
--- Epoch 35 / 1369 - 1668 epochs total
Iteration 0, loss = 0.0008
Iteration 20, loss = 0.0082
Iteration 40, loss = 0.0021
Iteration 60, loss = 0.0014
Iteration 80, loss = 0.0047
--- Epoch 36 / 1369 - 1669 epochs total
Iteration 0, loss = 0.0030
Iteration 20, loss = 0.0020
Iteration 40, loss = 0.0025
Iteration 60, loss = 0.0065
Iteration 80, loss = 0.0043
--- Epoch 37 / 1369 - 1670 epochs total
Iteration 0, loss = 0.0037
Iteration 20, loss = 0.0053
Iteration 40, loss = 0.0060
Iteration 60, loss = 0.0082
Iteration 80, loss = 0.0033
--- Epoch 38 / 1369 - 1671 epochs total
Iteration 0, loss = 0.0024
Iteration 20, loss = 0.0066
Iteration 40, loss = 0.0023
Iteration 60, loss = 0.0031
Iteration 80, loss = 0.0061
--- Epoch 39 / 1369 - 1672 epochs total
Iteration 0, loss = 0.0016
Iteration 20, loss = 0.0088
Iteration 40, loss = 0.0017
Iteration 60, loss = 0.0109
Iteration 80, loss = 0.0088
--- Epoch 40 / 1369 - 1673 epochs total
Iteration 0, loss = 0.0048
Iteration 20, loss = 0.0279
Iteration 40, loss = 0.0107
Iteration 60, loss = 0.0027
Iteration 80, loss = 0.0128
--- Epoch 41 / 1369 - 1674 epochs total
Iteration 0, loss = 0.0110
Iteration 20, loss = 0.0120
Iteration 40, loss = 0.0026
Iteration 60, loss = 0.0127
Iteration 80, loss = 0.0015
--- Epoch 42 / 1369 - 1675 epochs total
Iteration 0, loss = 0.0061
Iteration 20, loss = 0.0048
Iteration 40, loss = 0.0023
Iteration 60, loss = 0.0029
Iteration 80, loss = 0.0012
--- Epoch 43 / 1369 - 1676 epochs total
Iteration 0, loss = 0.0008
Iteration 20, loss = 0.0043
Iteration 40, loss = 0.0119
Iteration 60, loss = 0.0023
Iteration 80, loss = 0.0012
--- Epoch 44 / 1369 - 1677 epochs total
Iteration 0, loss = 0.0032
Iteration 20, loss = 0.0039
Iteration 40, loss = 0.0012
Iteration 60, loss = 0.0023
Iteration 80, loss = 0.0058
--- Epoch 45 / 1369 - 1678 epochs total
Iteration 0, loss = 0.0029
Iteration 20, loss = 0.0030
Iteration 40, loss = 0.0059
Iteration 60, loss = 0.0091
Iteration 80, loss = 0.0081
--- Epoch 46 / 1369 - 1679 epochs total
Iteration 0, loss = 0.0035
Iteration 20, loss = 0.0035
Iteration 40, loss = 0.0032
Iteration 60, loss = 0.0012
Iteration 80, loss = 0.0059
--- Epoch 47 / 1369 - 1680 epochs total
Iteration 0, loss = 0.0047
Iteration 20, loss = 0.0022
Iteration 40, loss = 0.0059
Iteration 60, loss = 0.0005
Iteration 80, loss = 0.0042
--- Epoch 48 / 1369 - 1681 epochs total
Iteration 0, loss = 0.0082
Iteration 20, loss = 0.0052
Iteration 40, loss = 0.0091
Iteration 60, loss = 0.0032
Iteration 80, loss = 0.0072
--- Epoch 49 / 1369 - 1682 epochs total
Iteration 0, loss = 0.0060
Iteration 20, loss = 0.0021
Iteration 40, loss = 0.0020
Iteration 60, loss = 0.0096
Iteration 80, loss = 0.0041
--- Epoch 50 / 1369 - 1683 epochs total
Iteration 0, loss = 0.0072
Iteration 20, loss = 0.0073
Iteration 40, loss = 0.0023
Iteration 60, loss = 0.0023
Iteration 80, loss = 0.0010
--- Epoch 51 / 1369 - 1684 epochs total
Iteration 0, loss = 0.0026
Iteration 20, loss = 0.0046
Iteration 40, loss = 0.0069
Iteration 60, loss = 0.0035
Iteration 80, loss = 0.0118
--- Epoch 52 / 1369 - 1685 epochs total
Iteration 0, loss = 0.0048
Iteration 20, loss = 0.0017
Iteration 40, loss = 0.0052
Iteration 60, loss = 0.0018
Iteration 80, loss = 0.0042
--- Epoch 53 / 1369 - 1686 epochs total
Iteration 0, loss = 0.0054
Iteration 20, loss = 0.0016
Iteration 40, loss = 0.0109
Iteration 60, loss = 0.0029
Iteration 80, loss = 0.0031
--- Epoch 54 / 1369 - 1687 epochs total
Iteration 0, loss = 0.0035
Iteration 20, loss = 0.0009
Iteration 40, loss = 0.0040
Iteration 60, loss = 0.0033
Iteration 80, loss = 0.0025
--- Epoch 55 / 1369 - 1688 epochs total
Iteration 0, loss = 0.0048
Iteration 20, loss = 0.0015
Iteration 40, loss = 0.0058
Iteration 60, loss = 0.0022
Iteration 80, loss = 0.0005
--- Epoch 56 / 1369 - 1689 epochs total
Iteration 0, loss = 0.0069
Iteration 20, loss = 0.0026
Iteration 40, loss = 0.0031
Iteration 60, loss = 0.0127
Iteration 80, loss = 0.0027
--- Epoch 57 / 1369 - 1690 epochs total
Iteration 0, loss = 0.0112
Iteration 20, loss = 0.0017
Iteration 40, loss = 0.0038
Iteration 60, loss = 0.0013
Iteration 80, loss = 0.0037
--- Epoch 58 / 1369 - 1691 epochs total
Iteration 0, loss = 0.0025
Iteration 20, loss = 0.0044
Iteration 40, loss = 0.0069
Iteration 60, loss = 0.0065
Iteration 80, loss = 0.0029
--- Epoch 59 / 1369 - 1692 epochs total
Iteration 0, loss = 0.0058
Iteration 20, loss = 0.0012
Iteration 40, loss = 0.0037
Iteration 60, loss = 0.0015
Iteration 80, loss = 0.0013
--- Epoch 60 / 1369 - 1693 epochs total
Iteration 0, loss = 0.0077
Iteration 20, loss = 0.0045
Iteration 40, loss = 0.0098
Iteration 60, loss = 0.0081
Iteration 80, loss = 0.0169
--- Epoch 61 / 1369 - 1694 epochs total
Iteration 0, loss = 0.0199
Iteration 20, loss = 0.0031
Iteration 40, loss = 0.0040
Iteration 60, loss = 0.0026
Iteration 80, loss = 0.0034
--- Epoch 62 / 1369 - 1695 epochs total
Iteration 0, loss = 0.0009
Iteration 20, loss = 0.0009
Iteration 40, loss = 0.0080
Iteration 60, loss = 0.0034
Iteration 80, loss = 0.0089
--- Epoch 63 / 1369 - 1696 epochs total
Iteration 0, loss = 0.0038
Iteration 20, loss = 0.0035
Iteration 40, loss = 0.0033
Iteration 60, loss = 0.0104
Iteration 80, loss = 0.0188
--- Epoch 64 / 1369 - 1697 epochs total
Iteration 0, loss = 0.0016
Iteration 20, loss = 0.0082
Iteration 40, loss = 0.0038
Iteration 60, loss = 0.0009
Iteration 80, loss = 0.0048
--- Epoch 65 / 1369 - 1698 epochs total
Iteration 0, loss = 0.0016
Iteration 20, loss = 0.0205
Iteration 40, loss = 0.0020
Iteration 60, loss = 0.0026
Iteration 80, loss = 0.0052
--- Epoch 66 / 1369 - 1699 epochs total
Iteration 0, loss = 0.0061
Iteration 20, loss = 0.0057
Iteration 40, loss = 0.0009
Iteration 60, loss = 0.0060
Iteration 80, loss = 0.0025
--- Epoch 67 / 1369 - 1700 epochs total
Iteration 0, loss = 0.0022
Iteration 20, loss = 0.0024
Iteration 40, loss = 0.0012
Iteration 60, loss = 0.0058
Iteration 80, loss = 0.0092
--- Epoch 68 / 1369 - 1701 epochs total
Iteration 0, loss = 0.0021
Iteration 20, loss = 0.0008
Iteration 40, loss = 0.0140
Iteration 60, loss = 0.0052
Iteration 80, loss = 0.0064
--- Epoch 69 / 1369 - 1702 epochs total
Iteration 0, loss = 0.0040
Iteration 20, loss = 0.0017
Iteration 40, loss = 0.0008
Iteration 60, loss = 0.0252
Iteration 80, loss = 0.0076
--- Epoch 70 / 1369 - 1703 epochs total
Iteration 0, loss = 0.0058
Iteration 20, loss = 0.0008
Iteration 40, loss = 0.0057
Iteration 60, loss = 0.0086
Iteration 80, loss = 0.0056
--- Epoch 71 / 1369 - 1704 epochs total
Iteration 0, loss = 0.0018
Iteration 20, loss = 0.0034
Iteration 40, loss = 0.0005
Iteration 60, loss = 0.0019
Iteration 80, loss = 0.0028
--- Epoch 72 / 1369 - 1705 epochs total
Iteration 0, loss = 0.0007
Iteration 20, loss = 0.0073
Iteration 40, loss = 0.0020
Iteration 60, loss = 0.0082
Iteration 80, loss = 0.0024
--- Epoch 73 / 1369 - 1706 epochs total
Iteration 0, loss = 0.0036
Iteration 20, loss = 0.0054
Iteration 40, loss = 0.0056
Iteration 60, loss = 0.0036
Iteration 80, loss = 0.0093
--- Epoch 74 / 1369 - 1707 epochs total
Iteration 0, loss = 0.0055
Iteration 20, loss = 0.0037
Iteration 40, loss = 0.0040
Iteration 60, loss = 0.0016
Iteration 80, loss = 0.0052
--- Epoch 75 / 1369 - 1708 epochs total
Iteration 0, loss = 0.0025
Iteration 20, loss = 0.0158
Iteration 40, loss = 0.0019
Iteration 60, loss = 0.0036
Iteration 80, loss = 0.0034
--- Epoch 76 / 1369 - 1709 epochs total
Iteration 0, loss = 0.0091
Iteration 20, loss = 0.0030
Iteration 40, loss = 0.0015
Iteration 60, loss = 0.0031
Iteration 80, loss = 0.0016
--- Epoch 77 / 1369 - 1710 epochs total
Iteration 0, loss = 0.0296
Iteration 20, loss = 0.0034
Iteration 40, loss = 0.0052
Iteration 60, loss = 0.0062
Iteration 80, loss = 0.0041
--- Epoch 78 / 1369 - 1711 epochs total
Iteration 0, loss = 0.0082
Iteration 20, loss = 0.0019
Iteration 40, loss = 0.0044
Iteration 60, loss = 0.0022
Iteration 80, loss = 0.0018
--- Epoch 79 / 1369 - 1712 epochs total
Iteration 0, loss = 0.0108
Iteration 20, loss = 0.0035
Iteration 40, loss = 0.0028
Iteration 60, loss = 0.0018
Iteration 80, loss = 0.0051
--- Epoch 80 / 1369 - 1713 epochs total
Iteration 0, loss = 0.0017
Iteration 20, loss = 0.0017
Iteration 40, loss = 0.0036
Iteration 60, loss = 0.0185
Iteration 80, loss = 0.0066
--- Epoch 81 / 1369 - 1714 epochs total
Iteration 0, loss = 0.0032
Iteration 20, loss = 0.0190
Iteration 40, loss = 0.0041
Iteration 60, loss = 0.0119
Iteration 80, loss = 0.0068
--- Epoch 82 / 1369 - 1715 epochs total
Iteration 0, loss = 0.0053
Iteration 20, loss = 0.0049
Iteration 40, loss = 0.0244
Iteration 60, loss = 0.0068
Iteration 80, loss = 0.0062
--- Epoch 83 / 1369 - 1716 epochs total
Iteration 0, loss = 0.0013
Iteration 20, loss = 0.0017
Iteration 40, loss = 0.0033
Iteration 60, loss = 0.0076
Iteration 80, loss = 0.0007
--- Epoch 84 / 1369 - 1717 epochs total
Iteration 0, loss = 0.0053
Iteration 20, loss = 0.0027
Iteration 40, loss = 0.0103
Iteration 60, loss = 0.0042
Iteration 80, loss = 0.0053
--- Epoch 85 / 1369 - 1718 epochs total
Iteration 0, loss = 0.0048
Iteration 20, loss = 0.0024
Iteration 40, loss = 0.0017
Iteration 60, loss = 0.0048
Iteration 80, loss = 0.0131
--- Epoch 86 / 1369 - 1719 epochs total
Iteration 0, loss = 0.0026
Iteration 20, loss = 0.0011
Iteration 40, loss = 0.0019
Iteration 60, loss = 0.0042
Iteration 80, loss = 0.0015
--- Epoch 87 / 1369 - 1720 epochs total
Iteration 0, loss = 0.0020
Iteration 20, loss = 0.0036
Iteration 40, loss = 0.0034
Iteration 60, loss = 0.0052
Iteration 80, loss = 0.0029
--- Epoch 88 / 1369 - 1721 epochs total
Iteration 0, loss = 0.0057
Iteration 20, loss = 0.0042
Iteration 40, loss = 0.0074
Iteration 60, loss = 0.0024
Iteration 80, loss = 0.0011
--- Epoch 89 / 1369 - 1722 epochs total
Iteration 0, loss = 0.0045
Iteration 20, loss = 0.0027
Iteration 40, loss = 0.0069
Iteration 60, loss = 0.0088
Iteration 80, loss = 0.0082
--- Epoch 90 / 1369 - 1723 epochs total
Iteration 0, loss = 0.0021
Iteration 20, loss = 0.0022
Iteration 40, loss = 0.0082
Iteration 60, loss = 0.0146
Iteration 80, loss = 0.0008
--- Epoch 91 / 1369 - 1724 epochs total
Iteration 0, loss = 0.0050
Iteration 20, loss = 0.0049
Iteration 40, loss = 0.0031
Iteration 60, loss = 0.0075
Iteration 80, loss = 0.0034
--- Epoch 92 / 1369 - 1725 epochs total
Iteration 0, loss = 0.0045
Iteration 20, loss = 0.0005
Iteration 40, loss = 0.0114
Iteration 60, loss = 0.0015
Iteration 80, loss = 0.0029
--- Epoch 93 / 1369 - 1726 epochs total
Iteration 0, loss = 0.0034
Iteration 20, loss = 0.0033
Iteration 40, loss = 0.0054
Iteration 60, loss = 0.0029
Iteration 80, loss = 0.0010
--- Epoch 94 / 1369 - 1727 epochs total
Iteration 0, loss = 0.0023
Iteration 20, loss = 0.0009
Iteration 40, loss = 0.0047
Iteration 60, loss = 0.0145
Iteration 80, loss = 0.0021
--- Epoch 95 / 1369 - 1728 epochs total
Iteration 0, loss = 0.0013
Iteration 20, loss = 0.0117
Iteration 40, loss = 0.0210
Iteration 60, loss = 0.0022
Iteration 80, loss = 0.0029
--- Epoch 96 / 1369 - 1729 epochs total
Iteration 0, loss = 0.0055
Iteration 20, loss = 0.0009
Iteration 40, loss = 0.0039
Iteration 60, loss = 0.0053
Iteration 80, loss = 0.0093
--- Epoch 97 / 1369 - 1730 epochs total
Iteration 0, loss = 0.0088
Iteration 20, loss = 0.0051
Iteration 40, loss = 0.0074
Iteration 60, loss = 0.0149
Iteration 80, loss = 0.0015
--- Epoch 98 / 1369 - 1731 epochs total
Iteration 0, loss = 0.0088
Iteration 20, loss = 0.0029
Iteration 40, loss = 0.0018
Iteration 60, loss = 0.0050
Iteration 80, loss = 0.0027
--- Epoch 99 / 1369 - 1732 epochs total
Iteration 0, loss = 0.0023
Iteration 20, loss = 0.0020
Iteration 40, loss = 0.0050
Iteration 60, loss = 0.0036
Iteration 80, loss = 0.0016
--- Epoch 100 / 1369 - 1733 epochs total
Iteration 0, loss = 0.0033
Iteration 20, loss = 0.0024
Iteration 40, loss = 0.0037
Iteration 60, loss = 0.0085
Iteration 80, loss = 0.0153
--- Epoch 101 / 1369 - 1734 epochs total
Iteration 0, loss = 0.0080
Iteration 20, loss = 0.0053
Iteration 40, loss = 0.0057
Iteration 60, loss = 0.0020
Iteration 80, loss = 0.0025
--- Epoch 102 / 1369 - 1735 epochs total
Iteration 0, loss = 0.0056
Iteration 20, loss = 0.0052
Iteration 40, loss = 0.0041
Iteration 60, loss = 0.0171
Iteration 80, loss = 0.0105
--- Epoch 103 / 1369 - 1736 epochs total
Iteration 0, loss = 0.0031
Iteration 20, loss = 0.0022
Iteration 40, loss = 0.0007
Iteration 60, loss = 0.0103
Iteration 80, loss = 0.0019
--- Epoch 104 / 1369 - 1737 epochs total
Iteration 0, loss = 0.0079
Iteration 20, loss = 0.0020
Iteration 40, loss = 0.0021
Iteration 60, loss = 0.0024
Iteration 80, loss = 0.0020
--- Epoch 105 / 1369 - 1738 epochs total
Iteration 0, loss = 0.0030
Iteration 20, loss = 0.0035
Iteration 40, loss = 0.0024
Iteration 60, loss = 0.0018
Iteration 80, loss = 0.0050
--- Epoch 106 / 1369 - 1739 epochs total
Iteration 0, loss = 0.0006
Iteration 20, loss = 0.0015
Iteration 40, loss = 0.0055
Iteration 60, loss = 0.0038
Iteration 80, loss = 0.0014
--- Epoch 107 / 1369 - 1740 epochs total
Iteration 0, loss = 0.0012
Iteration 20, loss = 0.0145
Iteration 40, loss = 0.0079
Iteration 60, loss = 0.0192
Iteration 80, loss = 0.0024
--- Epoch 108 / 1369 - 1741 epochs total
Iteration 0, loss = 0.0021
Iteration 20, loss = 0.0081
Iteration 40, loss = 0.0026
Iteration 60, loss = 0.0033
Iteration 80, loss = 0.0138
--- Epoch 109 / 1369 - 1742 epochs total
Iteration 0, loss = 0.0069
Iteration 20, loss = 0.0024
Iteration 40, loss = 0.0063
Iteration 60, loss = 0.0085
Iteration 80, loss = 0.0055
--- Epoch 110 / 1369 - 1743 epochs total
Iteration 0, loss = 0.0034
Iteration 20, loss = 0.0090
Iteration 40, loss = 0.0022
Iteration 60, loss = 0.0017
Iteration 80, loss = 0.0015
--- Epoch 111 / 1369 - 1744 epochs total
Iteration 0, loss = 0.0010
Iteration 20, loss = 0.0026
Iteration 40, loss = 0.0116
Iteration 60, loss = 0.0016
Iteration 80, loss = 0.0057
--- Epoch 112 / 1369 - 1745 epochs total
Iteration 0, loss = 0.0050
Iteration 20, loss = 0.0032
Iteration 40, loss = 0.0026
Iteration 60, loss = 0.0046
Iteration 80, loss = 0.0088
--- Epoch 113 / 1369 - 1746 epochs total
Iteration 0, loss = 0.0068
Iteration 20, loss = 0.0024
Iteration 40, loss = 0.0069
Iteration 60, loss = 0.0121
Iteration 80, loss = 0.0025
--- Epoch 114 / 1369 - 1747 epochs total
Iteration 0, loss = 0.0031
Iteration 20, loss = 0.0078
Iteration 40, loss = 0.0014
Iteration 60, loss = 0.0119
Iteration 80, loss = 0.0023
--- Epoch 115 / 1369 - 1748 epochs total
Iteration 0, loss = 0.0095
Iteration 20, loss = 0.0027
Iteration 40, loss = 0.0011
Iteration 60, loss = 0.0025
Iteration 80, loss = 0.0206
--- Epoch 116 / 1369 - 1749 epochs total
Iteration 0, loss = 0.0022
Iteration 20, loss = 0.0028
Iteration 40, loss = 0.0240
Iteration 60, loss = 0.0031
Iteration 80, loss = 0.0054
--- Epoch 117 / 1369 - 1750 epochs total
Iteration 0, loss = 0.0139
Iteration 20, loss = 0.0016
Iteration 40, loss = 0.0010
Iteration 60, loss = 0.0026
Iteration 80, loss = 0.0075
--- Epoch 118 / 1369 - 1751 epochs total
Iteration 0, loss = 0.0047
Iteration 20, loss = 0.0332
Iteration 40, loss = 0.0065
Iteration 60, loss = 0.0025
Iteration 80, loss = 0.0045
--- Epoch 119 / 1369 - 1752 epochs total
Iteration 0, loss = 0.0039
Iteration 20, loss = 0.0077
Iteration 40, loss = 0.0017
Iteration 60, loss = 0.0037
Iteration 80, loss = 0.0149
--- Epoch 120 / 1369 - 1753 epochs total
Iteration 0, loss = 0.0059
Iteration 20, loss = 0.0036
Iteration 40, loss = 0.0033
Iteration 60, loss = 0.0114
Iteration 80, loss = 0.0018
--- Epoch 121 / 1369 - 1754 epochs total
Iteration 0, loss = 0.0204
Iteration 20, loss = 0.0021
Iteration 40, loss = 0.0030
Iteration 60, loss = 0.0023
Iteration 80, loss = 0.0192
--- Epoch 122 / 1369 - 1755 epochs total
Iteration 0, loss = 0.0023
Iteration 20, loss = 0.0019
Iteration 40, loss = 0.0025
Iteration 60, loss = 0.0016
Iteration 80, loss = 0.0035
--- Epoch 123 / 1369 - 1756 epochs total
Iteration 0, loss = 0.0079
Iteration 20, loss = 0.0022
Iteration 40, loss = 0.0018
Iteration 60, loss = 0.0026
Iteration 80, loss = 0.0035
--- Epoch 124 / 1369 - 1757 epochs total
Iteration 0, loss = 0.0023
Iteration 20, loss = 0.0034
Iteration 40, loss = 0.0025
Iteration 60, loss = 0.0038
Iteration 80, loss = 0.0036
--- Epoch 125 / 1369 - 1758 epochs total
Iteration 0, loss = 0.0105
Iteration 20, loss = 0.0023
Iteration 40, loss = 0.0048
Iteration 60, loss = 0.0045
Iteration 80, loss = 0.0134
--- Epoch 126 / 1369 - 1759 epochs total
Iteration 0, loss = 0.0021
Iteration 20, loss = 0.0028
Iteration 40, loss = 0.0175
Iteration 60, loss = 0.0019
Iteration 80, loss = 0.0012
--- Epoch 127 / 1369 - 1760 epochs total
Iteration 0, loss = 0.0011
Iteration 20, loss = 0.0022
Iteration 40, loss = 0.0030
Iteration 60, loss = 0.0067
Iteration 80, loss = 0.0033
--- Epoch 128 / 1369 - 1761 epochs total
Iteration 0, loss = 0.0018
Iteration 20, loss = 0.0013
Iteration 40, loss = 0.0068
Iteration 60, loss = 0.0058
Iteration 80, loss = 0.0074
--- Epoch 129 / 1369 - 1762 epochs total
Iteration 0, loss = 0.0044
Iteration 20, loss = 0.0040
Iteration 40, loss = 0.0044
Iteration 60, loss = 0.0053
Iteration 80, loss = 0.0034
--- Epoch 130 / 1369 - 1763 epochs total
Iteration 0, loss = 0.0011
Iteration 20, loss = 0.0020
Iteration 40, loss = 0.0054
Iteration 60, loss = 0.0070
Iteration 80, loss = 0.0078
--- Epoch 131 / 1369 - 1764 epochs total
Iteration 0, loss = 0.0031
Iteration 20, loss = 0.0027
Iteration 40, loss = 0.0028
Iteration 60, loss = 0.0279
Iteration 80, loss = 0.0081
--- Epoch 132 / 1369 - 1765 epochs total
Iteration 0, loss = 0.0070
Iteration 20, loss = 0.0023
Iteration 40, loss = 0.0063
Iteration 60, loss = 0.0056
Iteration 80, loss = 0.0021
--- Epoch 133 / 1369 - 1766 epochs total
Iteration 0, loss = 0.0024
Iteration 20, loss = 0.0027
Iteration 40, loss = 0.0119
Iteration 60, loss = 0.0014
Iteration 80, loss = 0.0013
--- Epoch 134 / 1369 - 1767 epochs total
Iteration 0, loss = 0.0016
Iteration 20, loss = 0.0034
Iteration 40, loss = 0.0158
Iteration 60, loss = 0.0051
Iteration 80, loss = 0.0065
--- Epoch 135 / 1369 - 1768 epochs total
Iteration 0, loss = 0.0032
Iteration 20, loss = 0.0042
Iteration 40, loss = 0.0007
Iteration 60, loss = 0.0021
Iteration 80, loss = 0.0016
--- Epoch 136 / 1369 - 1769 epochs total
Iteration 0, loss = 0.0021
Iteration 20, loss = 0.0278
Iteration 40, loss = 0.0088
Iteration 60, loss = 0.0032
Iteration 80, loss = 0.0038
--- Epoch 137 / 1369 - 1770 epochs total
Iteration 0, loss = 0.0088
Iteration 20, loss = 0.0053
Iteration 40, loss = 0.0020
Iteration 60, loss = 0.0149
Iteration 80, loss = 0.0048
--- Epoch 138 / 1369 - 1771 epochs total
Iteration 0, loss = 0.0038
Iteration 20, loss = 0.0051
Iteration 40, loss = 0.0028
Iteration 60, loss = 0.0073
Iteration 80, loss = 0.0029
--- Epoch 139 / 1369 - 1772 epochs total
Iteration 0, loss = 0.0150
Iteration 20, loss = 0.0009
Iteration 40, loss = 0.0029
Iteration 60, loss = 0.0018
Iteration 80, loss = 0.0042
--- Epoch 140 / 1369 - 1773 epochs total
Iteration 0, loss = 0.0040
Iteration 20, loss = 0.0079
Iteration 40, loss = 0.0127
Iteration 60, loss = 0.0010
Iteration 80, loss = 0.0133
--- Epoch 141 / 1369 - 1774 epochs total
Iteration 0, loss = 0.0050
Iteration 20, loss = 0.0046
Iteration 40, loss = 0.0041
Iteration 60, loss = 0.0050
Iteration 80, loss = 0.0091
--- Epoch 142 / 1369 - 1775 epochs total
Iteration 0, loss = 0.0137
Iteration 20, loss = 0.0024
Iteration 40, loss = 0.0075
Iteration 60, loss = 0.0012
Iteration 80, loss = 0.0096
--- Epoch 143 / 1369 - 1776 epochs total
Iteration 0, loss = 0.0097
Iteration 20, loss = 0.0021
Iteration 40, loss = 0.0028
Iteration 60, loss = 0.0031
Iteration 80, loss = 0.0019
--- Epoch 144 / 1369 - 1777 epochs total
Iteration 0, loss = 0.0025
Iteration 20, loss = 0.0026
Iteration 40, loss = 0.0050
Iteration 60, loss = 0.0075
Iteration 80, loss = 0.0013
--- Epoch 145 / 1369 - 1778 epochs total
Iteration 0, loss = 0.0118
Iteration 20, loss = 0.0102
Iteration 40, loss = 0.0082
Iteration 60, loss = 0.0058
Iteration 80, loss = 0.0021
--- Epoch 146 / 1369 - 1779 epochs total
Iteration 0, loss = 0.0033
Iteration 20, loss = 0.0042
Iteration 40, loss = 0.0015
Iteration 60, loss = 0.0043
Iteration 80, loss = 0.0018
--- Epoch 147 / 1369 - 1780 epochs total
Iteration 0, loss = 0.0022
Iteration 20, loss = 0.0046
Iteration 40, loss = 0.0105
Iteration 60, loss = 0.0051
Iteration 80, loss = 0.0077
--- Epoch 148 / 1369 - 1781 epochs total
Iteration 0, loss = 0.0235
Iteration 20, loss = 0.0030
Iteration 40, loss = 0.0025
Iteration 60, loss = 0.0033
Iteration 80, loss = 0.0061
--- Epoch 149 / 1369 - 1782 epochs total
Iteration 0, loss = 0.0035
Iteration 20, loss = 0.0026
Iteration 40, loss = 0.0083
Iteration 60, loss = 0.0018
Iteration 80, loss = 0.0061
--- Epoch 150 / 1369 - 1783 epochs total
Iteration 0, loss = 0.0023
Iteration 20, loss = 0.0018
Iteration 40, loss = 0.0206
Iteration 60, loss = 0.0042
Iteration 80, loss = 0.0049
--- Epoch 151 / 1369 - 1784 epochs total
Iteration 0, loss = 0.0024
Iteration 20, loss = 0.0018
Iteration 40, loss = 0.0056
Iteration 60, loss = 0.0017
Iteration 80, loss = 0.0209
--- Epoch 152 / 1369 - 1785 epochs total
Iteration 0, loss = 0.0033
Iteration 20, loss = 0.0058
Iteration 40, loss = 0.0059
Iteration 60, loss = 0.0008
Iteration 80, loss = 0.0022
--- Epoch 153 / 1369 - 1786 epochs total
Iteration 0, loss = 0.0121
Iteration 20, loss = 0.0119
Iteration 40, loss = 0.0029
Iteration 60, loss = 0.0052
Iteration 80, loss = 0.0040
--- Epoch 154 / 1369 - 1787 epochs total
Iteration 0, loss = 0.0014
Iteration 20, loss = 0.0036
Iteration 40, loss = 0.0017
Iteration 60, loss = 0.0030
Iteration 80, loss = 0.0039
--- Epoch 155 / 1369 - 1788 epochs total
Iteration 0, loss = 0.0036
Iteration 20, loss = 0.0018
Iteration 40, loss = 0.0074
Iteration 60, loss = 0.0224
Iteration 80, loss = 0.0034
--- Epoch 156 / 1369 - 1789 epochs total
Iteration 0, loss = 0.0025
Iteration 20, loss = 0.0098
Iteration 40, loss = 0.0033
Iteration 60, loss = 0.0021
Iteration 80, loss = 0.0016
--- Epoch 157 / 1369 - 1790 epochs total
Iteration 0, loss = 0.0058
Iteration 20, loss = 0.0049
Iteration 40, loss = 0.0045
Iteration 60, loss = 0.0031
Iteration 80, loss = 0.0041
--- Epoch 158 / 1369 - 1791 epochs total
Iteration 0, loss = 0.0034
Iteration 20, loss = 0.0028
Iteration 40, loss = 0.0088
Iteration 60, loss = 0.0017
Iteration 80, loss = 0.0025
--- Epoch 159 / 1369 - 1792 epochs total
Iteration 0, loss = 0.0027
Iteration 20, loss = 0.0397
Iteration 40, loss = 0.0032
Iteration 60, loss = 0.0047
Iteration 80, loss = 0.0170
--- Epoch 160 / 1369 - 1793 epochs total
Iteration 0, loss = 0.0072
Iteration 20, loss = 0.0063
Iteration 40, loss = 0.0068
Iteration 60, loss = 0.0019
Iteration 80, loss = 0.0088
--- Epoch 161 / 1369 - 1794 epochs total
Iteration 0, loss = 0.0041
Iteration 20, loss = 0.0041
Iteration 40, loss = 0.0018
Iteration 60, loss = 0.0065
Iteration 80, loss = 0.0053
--- Epoch 162 / 1369 - 1795 epochs total
Iteration 0, loss = 0.0027
Iteration 20, loss = 0.0086
Iteration 40, loss = 0.0025
Iteration 60, loss = 0.0054
Iteration 80, loss = 0.0088
--- Epoch 163 / 1369 - 1796 epochs total
Iteration 0, loss = 0.0087
Iteration 20, loss = 0.0027
Iteration 40, loss = 0.0041
Iteration 60, loss = 0.0096
Iteration 80, loss = 0.0040
--- Epoch 164 / 1369 - 1797 epochs total
Iteration 0, loss = 0.0256
Iteration 20, loss = 0.0052
Iteration 40, loss = 0.0014
Iteration 60, loss = 0.0058
Iteration 80, loss = 0.0044
--- Epoch 165 / 1369 - 1798 epochs total
Iteration 0, loss = 0.0105
Iteration 20, loss = 0.0030
Iteration 40, loss = 0.0050
Iteration 60, loss = 0.0042
Iteration 80, loss = 0.0073
--- Epoch 166 / 1369 - 1799 epochs total
Iteration 0, loss = 0.0130
Iteration 20, loss = 0.0021
Iteration 40, loss = 0.0100
Iteration 60, loss = 0.0014
Iteration 80, loss = 0.0120
--- Epoch 167 / 1369 - 1800 epochs total
Iteration 0, loss = 0.0021
Iteration 20, loss = 0.0012
Iteration 40, loss = 0.0045
Iteration 60, loss = 0.0056
Iteration 80, loss = 0.0138
--- Epoch 168 / 1369 - 1801 epochs total
Iteration 0, loss = 0.0137
Iteration 20, loss = 0.0033
Iteration 40, loss = 0.0022
Iteration 60, loss = 0.0022
Iteration 80, loss = 0.0034
--- Epoch 169 / 1369 - 1802 epochs total
Iteration 0, loss = 0.0058
Iteration 20, loss = 0.0028
Iteration 40, loss = 0.0068
Iteration 60, loss = 0.0051
Iteration 80, loss = 0.0087
--- Epoch 170 / 1369 - 1803 epochs total
Iteration 0, loss = 0.0018
Iteration 20, loss = 0.0035
Iteration 40, loss = 0.0240
Iteration 60, loss = 0.0042
Iteration 80, loss = 0.0024
--- Epoch 171 / 1369 - 1804 epochs total
Iteration 0, loss = 0.0012
Iteration 20, loss = 0.0053
Iteration 40, loss = 0.0022
Iteration 60, loss = 0.0013
Iteration 80, loss = 0.0008
--- Epoch 172 / 1369 - 1805 epochs total
Iteration 0, loss = 0.0062
Iteration 20, loss = 0.0041
Iteration 40, loss = 0.0035
Iteration 60, loss = 0.0080
Iteration 80, loss = 0.0151
--- Epoch 173 / 1369 - 1806 epochs total
Iteration 0, loss = 0.0011
Iteration 20, loss = 0.0127
Iteration 40, loss = 0.0066
Iteration 60, loss = 0.0064
Iteration 80, loss = 0.0034
--- Epoch 174 / 1369 - 1807 epochs total
Iteration 0, loss = 0.0033
Iteration 20, loss = 0.0058
Iteration 40, loss = 0.0010
Iteration 60, loss = 0.0024
Iteration 80, loss = 0.0038
--- Epoch 175 / 1369 - 1808 epochs total
Iteration 0, loss = 0.0096
Iteration 20, loss = 0.0017
Iteration 40, loss = 0.0034
Iteration 60, loss = 0.0033
Iteration 80, loss = 0.0075
--- Epoch 176 / 1369 - 1809 epochs total
Iteration 0, loss = 0.0060
Iteration 20, loss = 0.0037
Iteration 40, loss = 0.0006
Iteration 60, loss = 0.0196
Iteration 80, loss = 0.0082
--- Epoch 177 / 1369 - 1810 epochs total
Iteration 0, loss = 0.0092
Iteration 20, loss = 0.0082
Iteration 40, loss = 0.0023
Iteration 60, loss = 0.0082
Iteration 80, loss = 0.0071
--- Epoch 178 / 1369 - 1811 epochs total
Iteration 0, loss = 0.0062
Iteration 20, loss = 0.0018
Iteration 40, loss = 0.0021
Iteration 60, loss = 0.0016
Iteration 80, loss = 0.0060
--- Epoch 179 / 1369 - 1812 epochs total
Iteration 0, loss = 0.0027
Iteration 20, loss = 0.0261
Iteration 40, loss = 0.0058
Iteration 60, loss = 0.0023
Iteration 80, loss = 0.0048
--- Epoch 180 / 1369 - 1813 epochs total
Iteration 0, loss = 0.0019
Iteration 20, loss = 0.0048
Iteration 40, loss = 0.0211
Iteration 60, loss = 0.0059
Iteration 80, loss = 0.0119
--- Epoch 181 / 1369 - 1814 epochs total
Iteration 0, loss = 0.0033
Iteration 20, loss = 0.0012
Iteration 40, loss = 0.0017
Iteration 60, loss = 0.0046
Iteration 80, loss = 0.0088
--- Epoch 182 / 1369 - 1815 epochs total
Iteration 0, loss = 0.0139
Iteration 20, loss = 0.0146
Iteration 40, loss = 0.0014
Iteration 60, loss = 0.0015
Iteration 80, loss = 0.0015
--- Epoch 183 / 1369 - 1816 epochs total
Iteration 0, loss = 0.0026
Iteration 20, loss = 0.0017
Iteration 40, loss = 0.0048
Iteration 60, loss = 0.0104
Iteration 80, loss = 0.0054
--- Epoch 184 / 1369 - 1817 epochs total
Iteration 0, loss = 0.0041
Iteration 20, loss = 0.0037
Iteration 40, loss = 0.0023
Iteration 60, loss = 0.0037
Iteration 80, loss = 0.0026
--- Epoch 185 / 1369 - 1818 epochs total
Iteration 0, loss = 0.0034
Iteration 20, loss = 0.0031
Iteration 40, loss = 0.0038
Iteration 60, loss = 0.0170
Iteration 80, loss = 0.0129
--- Epoch 186 / 1369 - 1819 epochs total
Iteration 0, loss = 0.0024
Iteration 20, loss = 0.0030
Iteration 40, loss = 0.0018
Iteration 60, loss = 0.0084
Iteration 80, loss = 0.0027
--- Epoch 187 / 1369 - 1820 epochs total
Iteration 0, loss = 0.0100
Iteration 20, loss = 0.0036
Iteration 40, loss = 0.0016
Iteration 60, loss = 0.0066
Iteration 80, loss = 0.0081
--- Epoch 188 / 1369 - 1821 epochs total
Iteration 0, loss = 0.0088
Iteration 20, loss = 0.0092
Iteration 40, loss = 0.0027
Iteration 60, loss = 0.0019
Iteration 80, loss = 0.0029
--- Epoch 189 / 1369 - 1822 epochs total
Iteration 0, loss = 0.0015
Iteration 20, loss = 0.0162
Iteration 40, loss = 0.0034
Iteration 60, loss = 0.0033
Iteration 80, loss = 0.0023
--- Epoch 190 / 1369 - 1823 epochs total
Iteration 0, loss = 0.0211
Iteration 20, loss = 0.0151
Iteration 40, loss = 0.0054
Iteration 60, loss = 0.0018
Iteration 80, loss = 0.0025
--- Epoch 191 / 1369 - 1824 epochs total
Iteration 0, loss = 0.0047
Iteration 20, loss = 0.0078
Iteration 40, loss = 0.0017
Iteration 60, loss = 0.0047
Iteration 80, loss = 0.0101
--- Epoch 192 / 1369 - 1825 epochs total
Iteration 0, loss = 0.0043
Iteration 20, loss = 0.0054
Iteration 40, loss = 0.0023
Iteration 60, loss = 0.0168
Iteration 80, loss = 0.0067
--- Epoch 193 / 1369 - 1826 epochs total
Iteration 0, loss = 0.0047
Iteration 20, loss = 0.0076
Iteration 40, loss = 0.0029
Iteration 60, loss = 0.0025
Iteration 80, loss = 0.0116
--- Epoch 194 / 1369 - 1827 epochs total
Iteration 0, loss = 0.0016
Iteration 20, loss = 0.0025
Iteration 40, loss = 0.0028
Iteration 60, loss = 0.0038
Iteration 80, loss = 0.0035
--- Epoch 195 / 1369 - 1828 epochs total
Iteration 0, loss = 0.0007
Iteration 20, loss = 0.0065
Iteration 40, loss = 0.0029
Iteration 60, loss = 0.0039
Iteration 80, loss = 0.0030
--- Epoch 196 / 1369 - 1829 epochs total
Iteration 0, loss = 0.0029
Iteration 20, loss = 0.0077
Iteration 40, loss = 0.0079
Iteration 60, loss = 0.0022
Iteration 80, loss = 0.0067
--- Epoch 197 / 1369 - 1830 epochs total
Iteration 0, loss = 0.0034
Iteration 20, loss = 0.0024
Iteration 40, loss = 0.0032
Iteration 60, loss = 0.0045
Iteration 80, loss = 0.0020
--- Epoch 198 / 1369 - 1831 epochs total
Iteration 0, loss = 0.0032
Iteration 20, loss = 0.0032
Iteration 40, loss = 0.0139
Iteration 60, loss = 0.0025
Iteration 80, loss = 0.0128
--- Epoch 199 / 1369 - 1832 epochs total
Iteration 0, loss = 0.0050
Iteration 20, loss = 0.0049
Iteration 40, loss = 0.0013
Iteration 60, loss = 0.0010
Iteration 80, loss = 0.0021
--- Epoch 200 / 1369 - 1833 epochs total
Iteration 0, loss = 0.0281
Iteration 20, loss = 0.0017
Iteration 40, loss = 0.0012
Iteration 60, loss = 0.0064
Iteration 80, loss = 0.0058
--- Epoch 201 / 1369 - 1834 epochs total
Iteration 0, loss = 0.0103
Iteration 20, loss = 0.0029
Iteration 40, loss = 0.0012
Iteration 60, loss = 0.0033
Iteration 80, loss = 0.0080
--- Epoch 202 / 1369 - 1835 epochs total
Iteration 0, loss = 0.0033
Iteration 20, loss = 0.0100
Iteration 40, loss = 0.0094
Iteration 60, loss = 0.0039
Iteration 80, loss = 0.0019
--- Epoch 203 / 1369 - 1836 epochs total
Iteration 0, loss = 0.0037
Iteration 20, loss = 0.0090
Iteration 40, loss = 0.0242
Iteration 60, loss = 0.0010
Iteration 80, loss = 0.0104
--- Epoch 204 / 1369 - 1837 epochs total
Iteration 0, loss = 0.0062
Iteration 20, loss = 0.0126
Iteration 40, loss = 0.0014
Iteration 60, loss = 0.0022
Iteration 80, loss = 0.0054
--- Epoch 205 / 1369 - 1838 epochs total
Iteration 0, loss = 0.0041
Iteration 20, loss = 0.0043
Iteration 40, loss = 0.0073
Iteration 60, loss = 0.0187
Iteration 80, loss = 0.0110
--- Epoch 206 / 1369 - 1839 epochs total
Iteration 0, loss = 0.0033
Iteration 20, loss = 0.0020
Iteration 40, loss = 0.0027
Iteration 60, loss = 0.0033
Iteration 80, loss = 0.0055
--- Epoch 207 / 1369 - 1840 epochs total
Iteration 0, loss = 0.0009
Iteration 20, loss = 0.0111
Iteration 40, loss = 0.0071
Iteration 60, loss = 0.0013
Iteration 80, loss = 0.0037
--- Epoch 208 / 1369 - 1841 epochs total
Iteration 0, loss = 0.0061
Iteration 20, loss = 0.0099
Iteration 40, loss = 0.0282
Iteration 60, loss = 0.0066
Iteration 80, loss = 0.0013
--- Epoch 209 / 1369 - 1842 epochs total
Iteration 0, loss = 0.0112
Iteration 20, loss = 0.0032
Iteration 40, loss = 0.0040
Iteration 60, loss = 0.0027
Iteration 80, loss = 0.0041
--- Epoch 210 / 1369 - 1843 epochs total
Iteration 0, loss = 0.0027
Iteration 20, loss = 0.0078
Iteration 40, loss = 0.0150
Iteration 60, loss = 0.0040
Iteration 80, loss = 0.0083
--- Epoch 211 / 1369 - 1844 epochs total
Iteration 0, loss = 0.0065
Iteration 20, loss = 0.0025
Iteration 40, loss = 0.0015
Iteration 60, loss = 0.0132
Iteration 80, loss = 0.0091
--- Epoch 212 / 1369 - 1845 epochs total
Iteration 0, loss = 0.0062
Iteration 20, loss = 0.0017
Iteration 40, loss = 0.0012
Iteration 60, loss = 0.0018
Iteration 80, loss = 0.0062
--- Epoch 213 / 1369 - 1846 epochs total
Iteration 0, loss = 0.0021
Iteration 20, loss = 0.0027
Iteration 40, loss = 0.0057
Iteration 60, loss = 0.0024
Iteration 80, loss = 0.0046
--- Epoch 214 / 1369 - 1847 epochs total
Iteration 0, loss = 0.0042
Iteration 20, loss = 0.0053
Iteration 40, loss = 0.0025
Iteration 60, loss = 0.0310
Iteration 80, loss = 0.0021
--- Epoch 215 / 1369 - 1848 epochs total
Iteration 0, loss = 0.0130
Iteration 20, loss = 0.0017
Iteration 40, loss = 0.0379
Iteration 60, loss = 0.0029
Iteration 80, loss = 0.0074
--- Epoch 216 / 1369 - 1849 epochs total
Iteration 0, loss = 0.0013
Iteration 20, loss = 0.0058
Iteration 40, loss = 0.0021
Iteration 60, loss = 0.0015
Iteration 80, loss = 0.0017
--- Epoch 217 / 1369 - 1850 epochs total
Iteration 0, loss = 0.0018
Iteration 20, loss = 0.0085
Iteration 40, loss = 0.0014
Iteration 60, loss = 0.0055
Iteration 80, loss = 0.0130
--- Epoch 218 / 1369 - 1851 epochs total
Iteration 0, loss = 0.0077
Iteration 20, loss = 0.0015
Iteration 40, loss = 0.0028
Iteration 60, loss = 0.0014
Iteration 80, loss = 0.0094
--- Epoch 219 / 1369 - 1852 epochs total
Iteration 0, loss = 0.0025
Iteration 20, loss = 0.0040
Iteration 40, loss = 0.0087
Iteration 60, loss = 0.0034
Iteration 80, loss = 0.0030
--- Epoch 220 / 1369 - 1853 epochs total
Iteration 0, loss = 0.0041
Iteration 20, loss = 0.0019
Iteration 40, loss = 0.0020
Iteration 60, loss = 0.0088
Iteration 80, loss = 0.0020
--- Epoch 221 / 1369 - 1854 epochs total
Iteration 0, loss = 0.0112
Iteration 20, loss = 0.0091
Iteration 40, loss = 0.0028
Iteration 60, loss = 0.0014
Iteration 80, loss = 0.0024
--- Epoch 222 / 1369 - 1855 epochs total
Iteration 0, loss = 0.0007
Iteration 20, loss = 0.0022
Iteration 40, loss = 0.0098
Iteration 60, loss = 0.0023
Iteration 80, loss = 0.0063
--- Epoch 223 / 1369 - 1856 epochs total
Iteration 0, loss = 0.0019
Iteration 20, loss = 0.0037
Iteration 40, loss = 0.0049
Iteration 60, loss = 0.0030
Iteration 80, loss = 0.0094
--- Epoch 224 / 1369 - 1857 epochs total
Iteration 0, loss = 0.0037
Iteration 20, loss = 0.0028
Iteration 40, loss = 0.0164
Iteration 60, loss = 0.0020
Iteration 80, loss = 0.0046
--- Epoch 225 / 1369 - 1858 epochs total
Iteration 0, loss = 0.0039
Iteration 20, loss = 0.0030
Iteration 40, loss = 0.0020
Iteration 60, loss = 0.0026
Iteration 80, loss = 0.0088
--- Epoch 226 / 1369 - 1859 epochs total
Iteration 0, loss = 0.0005
Iteration 20, loss = 0.0023
Iteration 40, loss = 0.0080
Iteration 60, loss = 0.0044
Iteration 80, loss = 0.0060
--- Epoch 227 / 1369 - 1860 epochs total
Iteration 0, loss = 0.0028
Iteration 20, loss = 0.0048
Iteration 40, loss = 0.0028
Iteration 60, loss = 0.0081
Iteration 80, loss = 0.0014
--- Epoch 228 / 1369 - 1861 epochs total
Iteration 0, loss = 0.0027
Iteration 20, loss = 0.0056
Iteration 40, loss = 0.0094
Iteration 60, loss = 0.0023
Iteration 80, loss = 0.0050
--- Epoch 229 / 1369 - 1862 epochs total
Iteration 0, loss = 0.0026
Iteration 20, loss = 0.0040
Iteration 40, loss = 0.0130
Iteration 60, loss = 0.0030
Iteration 80, loss = 0.0011
--- Epoch 230 / 1369 - 1863 epochs total
Iteration 0, loss = 0.0053
Iteration 20, loss = 0.0018
Iteration 40, loss = 0.0051
Iteration 60, loss = 0.0070
Iteration 80, loss = 0.0095
--- Epoch 231 / 1369 - 1864 epochs total
Iteration 0, loss = 0.0064
Iteration 20, loss = 0.0026
Iteration 40, loss = 0.0038
Iteration 60, loss = 0.0041
Iteration 80, loss = 0.0092
--- Epoch 232 / 1369 - 1865 epochs total
Iteration 0, loss = 0.0017
Iteration 20, loss = 0.0036
Iteration 40, loss = 0.0013
Iteration 60, loss = 0.0028
Iteration 80, loss = 0.0027
--- Epoch 233 / 1369 - 1866 epochs total
Iteration 0, loss = 0.0094
Iteration 20, loss = 0.0042
Iteration 40, loss = 0.0029
Iteration 60, loss = 0.0024
Iteration 80, loss = 0.0029
--- Epoch 234 / 1369 - 1867 epochs total
Iteration 0, loss = 0.0066
Iteration 20, loss = 0.0091
Iteration 40, loss = 0.0011
Iteration 60, loss = 0.0042
Iteration 80, loss = 0.0026
--- Epoch 235 / 1369 - 1868 epochs total
Iteration 0, loss = 0.0206
Iteration 20, loss = 0.0045
Iteration 40, loss = 0.0030
Iteration 60, loss = 0.0034
Iteration 80, loss = 0.0021
--- Epoch 236 / 1369 - 1869 epochs total
Iteration 0, loss = 0.0017
Iteration 20, loss = 0.0033
Iteration 40, loss = 0.0078
Iteration 60, loss = 0.0039
Iteration 80, loss = 0.0023
--- Epoch 237 / 1369 - 1870 epochs total
Iteration 0, loss = 0.0168
Iteration 20, loss = 0.0041
Iteration 40, loss = 0.0063
Iteration 60, loss = 0.0029
Iteration 80, loss = 0.0069
--- Epoch 238 / 1369 - 1871 epochs total
Iteration 0, loss = 0.0030
Iteration 20, loss = 0.0014
Iteration 40, loss = 0.0008
Iteration 60, loss = 0.0015
Iteration 80, loss = 0.0037
--- Epoch 239 / 1369 - 1872 epochs total
Iteration 0, loss = 0.0065
Iteration 20, loss = 0.0012
Iteration 40, loss = 0.0038
Iteration 60, loss = 0.0031
Iteration 80, loss = 0.0018
--- Epoch 240 / 1369 - 1873 epochs total
Iteration 0, loss = 0.0182
Iteration 20, loss = 0.0015
Iteration 40, loss = 0.0071
Iteration 60, loss = 0.0028
Iteration 80, loss = 0.0019
--- Epoch 241 / 1369 - 1874 epochs total
Iteration 0, loss = 0.0004
Iteration 20, loss = 0.0025
Iteration 40, loss = 0.0078
Iteration 60, loss = 0.0014
Iteration 80, loss = 0.0042
--- Epoch 242 / 1369 - 1875 epochs total
Iteration 0, loss = 0.0013
Iteration 20, loss = 0.0015
Iteration 40, loss = 0.0035
Iteration 60, loss = 0.0089
Iteration 80, loss = 0.0035
--- Epoch 243 / 1369 - 1876 epochs total
Iteration 0, loss = 0.0066
Iteration 20, loss = 0.0044
Iteration 40, loss = 0.0046
Iteration 60, loss = 0.0062
Iteration 80, loss = 0.0028
--- Epoch 244 / 1369 - 1877 epochs total
Iteration 0, loss = 0.0046
Iteration 20, loss = 0.0093
Iteration 40, loss = 0.0031
Iteration 60, loss = 0.0059
Iteration 80, loss = 0.0014
--- Epoch 245 / 1369 - 1878 epochs total
Iteration 0, loss = 0.0023
Iteration 20, loss = 0.0080
Iteration 40, loss = 0.0023
Iteration 60, loss = 0.0033
Iteration 80, loss = 0.0029
--- Epoch 246 / 1369 - 1879 epochs total
Iteration 0, loss = 0.0018
Iteration 20, loss = 0.0018
Iteration 40, loss = 0.0075
Iteration 60, loss = 0.0059
Iteration 80, loss = 0.0095
--- Epoch 247 / 1369 - 1880 epochs total
Iteration 0, loss = 0.0066
Iteration 20, loss = 0.0008
Iteration 40, loss = 0.0061
Iteration 60, loss = 0.0027
Iteration 80, loss = 0.0026
--- Epoch 248 / 1369 - 1881 epochs total
Iteration 0, loss = 0.0094
Iteration 20, loss = 0.0013
Iteration 40, loss = 0.0013
Iteration 60, loss = 0.0076
Iteration 80, loss = 0.0013
--- Epoch 249 / 1369 - 1882 epochs total
Iteration 0, loss = 0.0019
Iteration 20, loss = 0.0005
Iteration 40, loss = 0.0115
Iteration 60, loss = 0.0049
Iteration 80, loss = 0.0046
--- Epoch 250 / 1369 - 1883 epochs total
Iteration 0, loss = 0.0012
Iteration 20, loss = 0.0027
Iteration 40, loss = 0.0022
Iteration 60, loss = 0.0076
Iteration 80, loss = 0.0105
--- Epoch 251 / 1369 - 1884 epochs total
Iteration 0, loss = 0.0010
Iteration 20, loss = 0.0023
Iteration 40, loss = 0.0042
Iteration 60, loss = 0.0070
Iteration 80, loss = 0.0134
--- Epoch 252 / 1369 - 1885 epochs total
Iteration 0, loss = 0.0023
Iteration 20, loss = 0.0038
Iteration 40, loss = 0.0062
Iteration 60, loss = 0.0055
Iteration 80, loss = 0.0012
--- Epoch 253 / 1369 - 1886 epochs total
Iteration 0, loss = 0.0021
Iteration 20, loss = 0.0028
Iteration 40, loss = 0.0029
Iteration 60, loss = 0.0051
Iteration 80, loss = 0.0009
--- Epoch 254 / 1369 - 1887 epochs total
Iteration 0, loss = 0.0063
Iteration 20, loss = 0.0034
Iteration 40, loss = 0.0050
Iteration 60, loss = 0.0031
Iteration 80, loss = 0.0045
--- Epoch 255 / 1369 - 1888 epochs total
Iteration 0, loss = 0.0043
Iteration 20, loss = 0.0019
Iteration 40, loss = 0.0060
Iteration 60, loss = 0.0063
Iteration 80, loss = 0.0034
--- Epoch 256 / 1369 - 1889 epochs total
Iteration 0, loss = 0.0036
Iteration 20, loss = 0.0016
Iteration 40, loss = 0.0026
Iteration 60, loss = 0.0024
Iteration 80, loss = 0.0079
--- Epoch 257 / 1369 - 1890 epochs total
Iteration 0, loss = 0.0028
Iteration 20, loss = 0.0009
Iteration 40, loss = 0.0016
Iteration 60, loss = 0.0031
Iteration 80, loss = 0.0042
--- Epoch 258 / 1369 - 1891 epochs total
Iteration 0, loss = 0.0105
Iteration 20, loss = 0.0020
Iteration 40, loss = 0.0030
Iteration 60, loss = 0.0157
Iteration 80, loss = 0.0077
--- Epoch 259 / 1369 - 1892 epochs total
Iteration 0, loss = 0.0031
Iteration 20, loss = 0.0076
Iteration 40, loss = 0.0018
Iteration 60, loss = 0.0027
Iteration 80, loss = 0.0017
--- Epoch 260 / 1369 - 1893 epochs total
Iteration 0, loss = 0.0022
Iteration 20, loss = 0.0042
Iteration 40, loss = 0.0055
Iteration 60, loss = 0.0051
Iteration 80, loss = 0.0081
--- Epoch 261 / 1369 - 1894 epochs total
Iteration 0, loss = 0.0017
Iteration 20, loss = 0.0110
Iteration 40, loss = 0.0016
Iteration 60, loss = 0.0016
Iteration 80, loss = 0.0047
--- Epoch 262 / 1369 - 1895 epochs total
Iteration 0, loss = 0.0026
Iteration 20, loss = 0.0074
Iteration 40, loss = 0.0106
Iteration 60, loss = 0.0026
Iteration 80, loss = 0.0045
--- Epoch 263 / 1369 - 1896 epochs total
Iteration 0, loss = 0.0018
Iteration 20, loss = 0.0027
Iteration 40, loss = 0.0081
Iteration 60, loss = 0.0029
Iteration 80, loss = 0.0029
--- Epoch 264 / 1369 - 1897 epochs total
Iteration 0, loss = 0.0019
Iteration 20, loss = 0.0051
Iteration 40, loss = 0.0073
Iteration 60, loss = 0.0056
Iteration 80, loss = 0.0022
--- Epoch 265 / 1369 - 1898 epochs total
Iteration 0, loss = 0.0017
Iteration 20, loss = 0.0024
Iteration 40, loss = 0.0014
Iteration 60, loss = 0.0047
Iteration 80, loss = 0.0019
--- Epoch 266 / 1369 - 1899 epochs total
Iteration 0, loss = 0.0017
Iteration 20, loss = 0.0018
Iteration 40, loss = 0.0046
Iteration 60, loss = 0.0128
Iteration 80, loss = 0.0012
--- Epoch 267 / 1369 - 1900 epochs total
Iteration 0, loss = 0.0072
Iteration 20, loss = 0.0057
Iteration 40, loss = 0.0019
Iteration 60, loss = 0.0174
Iteration 80, loss = 0.0045
--- Epoch 268 / 1369 - 1901 epochs total
Iteration 0, loss = 0.0027
Iteration 20, loss = 0.0207
Iteration 40, loss = 0.0044
Iteration 60, loss = 0.0024
Iteration 80, loss = 0.0043
--- Epoch 269 / 1369 - 1902 epochs total
Iteration 0, loss = 0.0284
Iteration 20, loss = 0.0056
Iteration 40, loss = 0.0024
Iteration 60, loss = 0.0163
Iteration 80, loss = 0.0041
--- Epoch 270 / 1369 - 1903 epochs total
Iteration 0, loss = 0.0012
Iteration 20, loss = 0.0068
Iteration 40, loss = 0.0024
Iteration 60, loss = 0.0027
Iteration 80, loss = 0.0021
--- Epoch 271 / 1369 - 1904 epochs total
Iteration 0, loss = 0.0066
Iteration 20, loss = 0.0094
Iteration 40, loss = 0.0079
Iteration 60, loss = 0.0053
Iteration 80, loss = 0.0092
--- Epoch 272 / 1369 - 1905 epochs total
Iteration 0, loss = 0.0037
Iteration 20, loss = 0.0098
Iteration 40, loss = 0.0065
Iteration 60, loss = 0.0074
Iteration 80, loss = 0.0310
--- Epoch 273 / 1369 - 1906 epochs total
Iteration 0, loss = 0.0044
Iteration 20, loss = 0.0017
Iteration 40, loss = 0.0052
Iteration 60, loss = 0.0047
Iteration 80, loss = 0.0018
--- Epoch 274 / 1369 - 1907 epochs total
Iteration 0, loss = 0.0050
Iteration 20, loss = 0.0096
Iteration 40, loss = 0.0012
Iteration 60, loss = 0.0023
Iteration 80, loss = 0.0058
--- Epoch 275 / 1369 - 1908 epochs total
Iteration 0, loss = 0.0077
Iteration 20, loss = 0.0116
Iteration 40, loss = 0.0028
Iteration 60, loss = 0.0008
Iteration 80, loss = 0.0035
--- Epoch 276 / 1369 - 1909 epochs total
Iteration 0, loss = 0.0081
Iteration 20, loss = 0.0064
Iteration 40, loss = 0.0041
Iteration 60, loss = 0.0053
Iteration 80, loss = 0.0019
--- Epoch 277 / 1369 - 1910 epochs total
Iteration 0, loss = 0.0031
Iteration 20, loss = 0.0042
Iteration 40, loss = 0.0094
Iteration 60, loss = 0.0116
Iteration 80, loss = 0.0041
--- Epoch 278 / 1369 - 1911 epochs total
Iteration 0, loss = 0.0067
Iteration 20, loss = 0.0042
Iteration 40, loss = 0.0042
Iteration 60, loss = 0.0063
Iteration 80, loss = 0.0023
--- Epoch 279 / 1369 - 1912 epochs total
Iteration 0, loss = 0.0100
Iteration 20, loss = 0.0046
Iteration 40, loss = 0.0013
Iteration 60, loss = 0.0161
Iteration 80, loss = 0.0019
--- Epoch 280 / 1369 - 1913 epochs total
Iteration 0, loss = 0.0013
Iteration 20, loss = 0.0019
Iteration 40, loss = 0.0072
Iteration 60, loss = 0.0052
Iteration 80, loss = 0.0015
--- Epoch 281 / 1369 - 1914 epochs total
Iteration 0, loss = 0.0045
Iteration 20, loss = 0.0012
Iteration 40, loss = 0.0016
Iteration 60, loss = 0.0055
Iteration 80, loss = 0.0074
--- Epoch 282 / 1369 - 1915 epochs total
Iteration 0, loss = 0.0028
Iteration 20, loss = 0.0120
Iteration 40, loss = 0.0045
Iteration 60, loss = 0.0137
Iteration 80, loss = 0.0064
--- Epoch 283 / 1369 - 1916 epochs total
Iteration 0, loss = 0.0033
Iteration 20, loss = 0.0040
Iteration 40, loss = 0.0112
Iteration 60, loss = 0.0058
Iteration 80, loss = 0.0040
--- Epoch 284 / 1369 - 1917 epochs total
Iteration 0, loss = 0.0108
Iteration 20, loss = 0.0101
Iteration 40, loss = 0.0052
Iteration 60, loss = 0.0047
Iteration 80, loss = 0.0026
--- Epoch 285 / 1369 - 1918 epochs total
Iteration 0, loss = 0.0026
Iteration 20, loss = 0.0250
Iteration 40, loss = 0.0020
Iteration 60, loss = 0.0107
Iteration 80, loss = 0.0025
--- Epoch 286 / 1369 - 1919 epochs total
Iteration 0, loss = 0.0150
Iteration 20, loss = 0.0030
Iteration 40, loss = 0.0040
Iteration 60, loss = 0.0118
Iteration 80, loss = 0.0074
--- Epoch 287 / 1369 - 1920 epochs total
Iteration 0, loss = 0.0027
Iteration 20, loss = 0.0082
Iteration 40, loss = 0.0052
Iteration 60, loss = 0.0057
Iteration 80, loss = 0.0022
--- Epoch 288 / 1369 - 1921 epochs total
Iteration 0, loss = 0.0044
Iteration 20, loss = 0.0005
Iteration 40, loss = 0.0014
Iteration 60, loss = 0.0044
Iteration 80, loss = 0.0038
--- Epoch 289 / 1369 - 1922 epochs total
Iteration 0, loss = 0.0021
Iteration 20, loss = 0.0025
Iteration 40, loss = 0.0048
Iteration 60, loss = 0.0018
Iteration 80, loss = 0.0019
--- Epoch 290 / 1369 - 1923 epochs total
Iteration 0, loss = 0.0015
Iteration 20, loss = 0.0025
Iteration 40, loss = 0.0032
Iteration 60, loss = 0.0056
Iteration 80, loss = 0.0046
--- Epoch 291 / 1369 - 1924 epochs total
Iteration 0, loss = 0.0035
Iteration 20, loss = 0.0235
Iteration 40, loss = 0.0028
Iteration 60, loss = 0.0083
Iteration 80, loss = 0.0053
--- Epoch 292 / 1369 - 1925 epochs total
Iteration 0, loss = 0.0021
Iteration 20, loss = 0.0023
Iteration 40, loss = 0.0013
Iteration 60, loss = 0.0009
Iteration 80, loss = 0.0056
--- Epoch 293 / 1369 - 1926 epochs total
Iteration 0, loss = 0.0027
Iteration 20, loss = 0.0036
Iteration 40, loss = 0.0025
Iteration 60, loss = 0.0010
Iteration 80, loss = 0.0073
--- Epoch 294 / 1369 - 1927 epochs total
Iteration 0, loss = 0.0156
Iteration 20, loss = 0.0064
Iteration 40, loss = 0.0014
Iteration 60, loss = 0.0016
Iteration 80, loss = 0.0031
--- Epoch 295 / 1369 - 1928 epochs total
Iteration 0, loss = 0.0020
Iteration 20, loss = 0.0043
Iteration 40, loss = 0.0030
Iteration 60, loss = 0.0053
Iteration 80, loss = 0.0020
--- Epoch 296 / 1369 - 1929 epochs total
Iteration 0, loss = 0.0020
Iteration 20, loss = 0.0053
Iteration 40, loss = 0.0031
Iteration 60, loss = 0.0081
Iteration 80, loss = 0.0033
--- Epoch 297 / 1369 - 1930 epochs total
Iteration 0, loss = 0.0086
Iteration 20, loss = 0.0031
Iteration 40, loss = 0.0011
Iteration 60, loss = 0.0029
Iteration 80, loss = 0.0017
--- Epoch 298 / 1369 - 1931 epochs total
Iteration 0, loss = 0.0027
Iteration 20, loss = 0.0073
Iteration 40, loss = 0.0072
Iteration 60, loss = 0.0069
Iteration 80, loss = 0.0173
--- Epoch 299 / 1369 - 1932 epochs total
Iteration 0, loss = 0.0044
Iteration 20, loss = 0.0040
Iteration 40, loss = 0.0043
Iteration 60, loss = 0.0086
Iteration 80, loss = 0.0015
--- Epoch 300 / 1369 - 1933 epochs total
Iteration 0, loss = 0.0116
Iteration 20, loss = 0.0008
Iteration 40, loss = 0.0030
Iteration 60, loss = 0.0088
Iteration 80, loss = 0.0010
--- Epoch 301 / 1369 - 1934 epochs total
Iteration 0, loss = 0.0019
Iteration 20, loss = 0.0079
Iteration 40, loss = 0.0050
Iteration 60, loss = 0.0022
Iteration 80, loss = 0.0125
--- Epoch 302 / 1369 - 1935 epochs total
Iteration 0, loss = 0.0024
Iteration 20, loss = 0.0025
Iteration 40, loss = 0.0032
Iteration 60, loss = 0.0016
Iteration 80, loss = 0.0029
--- Epoch 303 / 1369 - 1936 epochs total
Iteration 0, loss = 0.0024
Iteration 20, loss = 0.0031
Iteration 40, loss = 0.0025
Iteration 60, loss = 0.0032
Iteration 80, loss = 0.0051
--- Epoch 304 / 1369 - 1937 epochs total
Iteration 0, loss = 0.0053
Iteration 20, loss = 0.0035
Iteration 40, loss = 0.0032
Iteration 60, loss = 0.0035
Iteration 80, loss = 0.0068
--- Epoch 305 / 1369 - 1938 epochs total
Iteration 0, loss = 0.0100
Iteration 20, loss = 0.0077
Iteration 40, loss = 0.0034
Iteration 60, loss = 0.0030
Iteration 80, loss = 0.0015
--- Epoch 306 / 1369 - 1939 epochs total
Iteration 0, loss = 0.0027
Iteration 20, loss = 0.0039
Iteration 40, loss = 0.0012
Iteration 60, loss = 0.0032
Iteration 80, loss = 0.0032
--- Epoch 307 / 1369 - 1940 epochs total
Iteration 0, loss = 0.0135
Iteration 20, loss = 0.0029
Iteration 40, loss = 0.0023
Iteration 60, loss = 0.0074
Iteration 80, loss = 0.0057
--- Epoch 308 / 1369 - 1941 epochs total
Iteration 0, loss = 0.0022
Iteration 20, loss = 0.0043
Iteration 40, loss = 0.0026
Iteration 60, loss = 0.0053
Iteration 80, loss = 0.0178
--- Epoch 309 / 1369 - 1942 epochs total
Iteration 0, loss = 0.0310
Iteration 20, loss = 0.0103
Iteration 40, loss = 0.0006
Iteration 60, loss = 0.0071
Iteration 80, loss = 0.0032
--- Epoch 310 / 1369 - 1943 epochs total
Iteration 0, loss = 0.0009
Iteration 20, loss = 0.0024
Iteration 40, loss = 0.0019
Iteration 60, loss = 0.0015
Iteration 80, loss = 0.0025
--- Epoch 311 / 1369 - 1944 epochs total
Iteration 0, loss = 0.0081
Iteration 20, loss = 0.0059
Iteration 40, loss = 0.0082
Iteration 60, loss = 0.0036
Iteration 80, loss = 0.0076
--- Epoch 312 / 1369 - 1945 epochs total
Iteration 0, loss = 0.0012
Iteration 20, loss = 0.0027
Iteration 40, loss = 0.0051
Iteration 60, loss = 0.0016
Iteration 80, loss = 0.0073
--- Epoch 313 / 1369 - 1946 epochs total
Iteration 0, loss = 0.0025
Iteration 20, loss = 0.0100
Iteration 40, loss = 0.0036
Iteration 60, loss = 0.0017
Iteration 80, loss = 0.0076
--- Epoch 314 / 1369 - 1947 epochs total
Iteration 0, loss = 0.0016
Iteration 20, loss = 0.0052
Iteration 40, loss = 0.0019
Iteration 60, loss = 0.0011
Iteration 80, loss = 0.0009
--- Epoch 315 / 1369 - 1948 epochs total
Iteration 0, loss = 0.0073
Iteration 20, loss = 0.0047
Iteration 40, loss = 0.0018
Iteration 60, loss = 0.0047
Iteration 80, loss = 0.0016
--- Epoch 316 / 1369 - 1949 epochs total
Iteration 0, loss = 0.0232
Iteration 20, loss = 0.0013
Iteration 40, loss = 0.0114
Iteration 60, loss = 0.0036
Iteration 80, loss = 0.0036
--- Epoch 317 / 1369 - 1950 epochs total
Iteration 0, loss = 0.0052
Iteration 20, loss = 0.0069
Iteration 40, loss = 0.0048
Iteration 60, loss = 0.0039
Iteration 80, loss = 0.0099
--- Epoch 318 / 1369 - 1951 epochs total
Iteration 0, loss = 0.0029
Iteration 20, loss = 0.0011
Iteration 40, loss = 0.0015
Iteration 60, loss = 0.0008
Iteration 80, loss = 0.0013
--- Epoch 319 / 1369 - 1952 epochs total
Iteration 0, loss = 0.0015
Iteration 20, loss = 0.0029
Iteration 40, loss = 0.0057
Iteration 60, loss = 0.0022
Iteration 80, loss = 0.0079
--- Epoch 320 / 1369 - 1953 epochs total
Iteration 0, loss = 0.0029
Iteration 20, loss = 0.0014
Iteration 40, loss = 0.0031
Iteration 60, loss = 0.0040
Iteration 80, loss = 0.0015
--- Epoch 321 / 1369 - 1954 epochs total
Iteration 0, loss = 0.0143
Iteration 20, loss = 0.0163
Iteration 40, loss = 0.0029
Iteration 60, loss = 0.0019
Iteration 80, loss = 0.0038
--- Epoch 322 / 1369 - 1955 epochs total
Iteration 0, loss = 0.0015
Iteration 20, loss = 0.0035
Iteration 40, loss = 0.0036
Iteration 60, loss = 0.0051
Iteration 80, loss = 0.0022
--- Epoch 323 / 1369 - 1956 epochs total
Iteration 0, loss = 0.0024
Iteration 20, loss = 0.0010
Iteration 40, loss = 0.0090
Iteration 60, loss = 0.0023
Iteration 80, loss = 0.0055
--- Epoch 324 / 1369 - 1957 epochs total
Iteration 0, loss = 0.0049
Iteration 20, loss = 0.0047
Iteration 40, loss = 0.0029
Iteration 60, loss = 0.0020
Iteration 80, loss = 0.0078
--- Epoch 325 / 1369 - 1958 epochs total
Iteration 0, loss = 0.0065
Iteration 20, loss = 0.0162
Iteration 40, loss = 0.0046
Iteration 60, loss = 0.0030
Iteration 80, loss = 0.0017
--- Epoch 326 / 1369 - 1959 epochs total
Iteration 0, loss = 0.0036
Iteration 20, loss = 0.0016
Iteration 40, loss = 0.0096
Iteration 60, loss = 0.0055
Iteration 80, loss = 0.0100
--- Epoch 327 / 1369 - 1960 epochs total
Iteration 0, loss = 0.0104
Iteration 20, loss = 0.0023
Iteration 40, loss = 0.0032
Iteration 60, loss = 0.0025
Iteration 80, loss = 0.0054
--- Epoch 328 / 1369 - 1961 epochs total
Iteration 0, loss = 0.0084
Iteration 20, loss = 0.0011
Iteration 40, loss = 0.0033
Iteration 60, loss = 0.0033
Iteration 80, loss = 0.0036
--- Epoch 329 / 1369 - 1962 epochs total
Iteration 0, loss = 0.0105
Iteration 20, loss = 0.0011
Iteration 40, loss = 0.0026
Iteration 60, loss = 0.0022
Iteration 80, loss = 0.0087
--- Epoch 330 / 1369 - 1963 epochs total
Iteration 0, loss = 0.0165
Iteration 20, loss = 0.0071
Iteration 40, loss = 0.0019
Iteration 60, loss = 0.0019
Iteration 80, loss = 0.0035
--- Epoch 331 / 1369 - 1964 epochs total
Iteration 0, loss = 0.0013
Iteration 20, loss = 0.0115
Iteration 40, loss = 0.0164
Iteration 60, loss = 0.0059
Iteration 80, loss = 0.0014
--- Epoch 332 / 1369 - 1965 epochs total
Iteration 0, loss = 0.0009
Iteration 20, loss = 0.0045
Iteration 40, loss = 0.0016
Iteration 60, loss = 0.0036
Iteration 80, loss = 0.0038
--- Epoch 333 / 1369 - 1966 epochs total
Iteration 0, loss = 0.0144
Iteration 20, loss = 0.0156
Iteration 40, loss = 0.0086
Iteration 60, loss = 0.0092
Iteration 80, loss = 0.0329
--- Epoch 334 / 1369 - 1967 epochs total
Iteration 0, loss = 0.0015
Iteration 20, loss = 0.0033
Iteration 40, loss = 0.0005
Iteration 60, loss = 0.0030
Iteration 80, loss = 0.0015
--- Epoch 335 / 1369 - 1968 epochs total
Iteration 0, loss = 0.0101
Iteration 20, loss = 0.0204
Iteration 40, loss = 0.0029
Iteration 60, loss = 0.0173
Iteration 80, loss = 0.0048
--- Epoch 336 / 1369 - 1969 epochs total
Iteration 0, loss = 0.0027
Iteration 20, loss = 0.0047
Iteration 40, loss = 0.0019
Iteration 60, loss = 0.0037
Iteration 80, loss = 0.0022
--- Epoch 337 / 1369 - 1970 epochs total
Iteration 0, loss = 0.0155
Iteration 20, loss = 0.0013
Iteration 40, loss = 0.0159
Iteration 60, loss = 0.0061
Iteration 80, loss = 0.0016
--- Epoch 338 / 1369 - 1971 epochs total
Iteration 0, loss = 0.0006
Iteration 20, loss = 0.0013
Iteration 40, loss = 0.0058
Iteration 60, loss = 0.0093
Iteration 80, loss = 0.0076
--- Epoch 339 / 1369 - 1972 epochs total
Iteration 0, loss = 0.0055
Iteration 20, loss = 0.0067
Iteration 40, loss = 0.0011
Iteration 60, loss = 0.0008
Iteration 80, loss = 0.0034
--- Epoch 340 / 1369 - 1973 epochs total
Iteration 0, loss = 0.0029
Iteration 20, loss = 0.0039
Iteration 40, loss = 0.0072
Iteration 60, loss = 0.0011
Iteration 80, loss = 0.0052
--- Epoch 341 / 1369 - 1974 epochs total
Iteration 0, loss = 0.0025
Iteration 20, loss = 0.0122
Iteration 40, loss = 0.0142
Iteration 60, loss = 0.0084
Iteration 80, loss = 0.0011
--- Epoch 342 / 1369 - 1975 epochs total
Iteration 0, loss = 0.0180
Iteration 20, loss = 0.0038
Iteration 40, loss = 0.0031
Iteration 60, loss = 0.0114
Iteration 80, loss = 0.0151
--- Epoch 343 / 1369 - 1976 epochs total
Iteration 0, loss = 0.0019
Iteration 20, loss = 0.0031
Iteration 40, loss = 0.0023
Iteration 60, loss = 0.0022
Iteration 80, loss = 0.0020
--- Epoch 344 / 1369 - 1977 epochs total
Iteration 0, loss = 0.0034
Iteration 20, loss = 0.0053
Iteration 40, loss = 0.0027
Iteration 60, loss = 0.0005
Iteration 80, loss = 0.0095
--- Epoch 345 / 1369 - 1978 epochs total
Iteration 0, loss = 0.0030
Iteration 20, loss = 0.0019
Iteration 40, loss = 0.0012
Iteration 60, loss = 0.0045
Iteration 80, loss = 0.0024
--- Epoch 346 / 1369 - 1979 epochs total
Iteration 0, loss = 0.0038
Iteration 20, loss = 0.0044
Iteration 40, loss = 0.0036
Iteration 60, loss = 0.0033
Iteration 80, loss = 0.0013
--- Epoch 347 / 1369 - 1980 epochs total
Iteration 0, loss = 0.0015
Iteration 20, loss = 0.0037
Iteration 40, loss = 0.0017
Iteration 60, loss = 0.0012
Iteration 80, loss = 0.0009
--- Epoch 348 / 1369 - 1981 epochs total
Iteration 0, loss = 0.0124
Iteration 20, loss = 0.0022
Iteration 40, loss = 0.0082
Iteration 60, loss = 0.0036
Iteration 80, loss = 0.0060
--- Epoch 349 / 1369 - 1982 epochs total
Iteration 0, loss = 0.0036
Iteration 20, loss = 0.0333
Iteration 40, loss = 0.0046
Iteration 60, loss = 0.0044
Iteration 80, loss = 0.0067
--- Epoch 350 / 1369 - 1983 epochs total
Iteration 0, loss = 0.0046
Iteration 20, loss = 0.0075
Iteration 40, loss = 0.0033
Iteration 60, loss = 0.0118
Iteration 80, loss = 0.0026
--- Epoch 351 / 1369 - 1984 epochs total
Iteration 0, loss = 0.0149
Iteration 20, loss = 0.0013
Iteration 40, loss = 0.0081
Iteration 60, loss = 0.0012
Iteration 80, loss = 0.0018
--- Epoch 352 / 1369 - 1985 epochs total
Iteration 0, loss = 0.0021
Iteration 20, loss = 0.0025
Iteration 40, loss = 0.0021
Iteration 60, loss = 0.0068
Iteration 80, loss = 0.0035
--- Epoch 353 / 1369 - 1986 epochs total
Iteration 0, loss = 0.0107
Iteration 20, loss = 0.0158
Iteration 40, loss = 0.0009
Iteration 60, loss = 0.0010
Iteration 80, loss = 0.0256
--- Epoch 354 / 1369 - 1987 epochs total
Iteration 0, loss = 0.0106
Iteration 20, loss = 0.0020
Iteration 40, loss = 0.0085
Iteration 60, loss = 0.0036
Iteration 80, loss = 0.0050
--- Epoch 355 / 1369 - 1988 epochs total
Iteration 0, loss = 0.0048
Iteration 20, loss = 0.0027
Iteration 40, loss = 0.0147
Iteration 60, loss = 0.0024
Iteration 80, loss = 0.0020
--- Epoch 356 / 1369 - 1989 epochs total
Iteration 0, loss = 0.0015
Iteration 20, loss = 0.0082
Iteration 40, loss = 0.0223
Iteration 60, loss = 0.0024
Iteration 80, loss = 0.0052
--- Epoch 357 / 1369 - 1990 epochs total
Iteration 0, loss = 0.0024
Iteration 20, loss = 0.0118
Iteration 40, loss = 0.0031
Iteration 60, loss = 0.0050
Iteration 80, loss = 0.0108
--- Epoch 358 / 1369 - 1991 epochs total
Iteration 0, loss = 0.0049
Iteration 20, loss = 0.0049
Iteration 40, loss = 0.0021
Iteration 60, loss = 0.0060
Iteration 80, loss = 0.0100
--- Epoch 359 / 1369 - 1992 epochs total
Iteration 0, loss = 0.0055
Iteration 20, loss = 0.0028
Iteration 40, loss = 0.0053
Iteration 60, loss = 0.0031
Iteration 80, loss = 0.0062
--- Epoch 360 / 1369 - 1993 epochs total
Iteration 0, loss = 0.0034
Iteration 20, loss = 0.0089
Iteration 40, loss = 0.0080
Iteration 60, loss = 0.0008
Iteration 80, loss = 0.0021
--- Epoch 361 / 1369 - 1994 epochs total
Iteration 0, loss = 0.0286
Iteration 20, loss = 0.0029
Iteration 40, loss = 0.0122
Iteration 60, loss = 0.0005
Iteration 80, loss = 0.0031
--- Epoch 362 / 1369 - 1995 epochs total
Iteration 0, loss = 0.0033
Iteration 20, loss = 0.0026
Iteration 40, loss = 0.0028
Iteration 60, loss = 0.0020
Iteration 80, loss = 0.0020
--- Epoch 363 / 1369 - 1996 epochs total
Iteration 0, loss = 0.0025
Iteration 20, loss = 0.0261
Iteration 40, loss = 0.0024
Iteration 60, loss = 0.0042
Iteration 80, loss = 0.0021
--- Epoch 364 / 1369 - 1997 epochs total
Iteration 0, loss = 0.0030
Iteration 20, loss = 0.0068
Iteration 40, loss = 0.0033
Iteration 60, loss = 0.0020
Iteration 80, loss = 0.0061
--- Epoch 365 / 1369 - 1998 epochs total
Iteration 0, loss = 0.0048
Iteration 20, loss = 0.0044
Iteration 40, loss = 0.0067
Iteration 60, loss = 0.0096
Iteration 80, loss = 0.0048
--- Epoch 366 / 1369 - 1999 epochs total
Iteration 0, loss = 0.0142
Iteration 20, loss = 0.0015
Iteration 40, loss = 0.0024
Iteration 60, loss = 0.0088
Iteration 80, loss = 0.0011
--- Epoch 367 / 1369 - 2000 epochs total
Iteration 0, loss = 0.0149
Iteration 20, loss = 0.0021
Iteration 40, loss = 0.0043
Iteration 60, loss = 0.0015
Iteration 80, loss = 0.0020
--- Epoch 368 / 1369 - 2001 epochs total
Iteration 0, loss = 0.0021
Iteration 20, loss = 0.0021
Iteration 40, loss = 0.0022
Iteration 60, loss = 0.0017
Iteration 80, loss = 0.0069
--- Epoch 369 / 1369 - 2002 epochs total
Iteration 0, loss = 0.0021
Iteration 20, loss = 0.0062
Iteration 40, loss = 0.0016
Iteration 60, loss = 0.0019
Iteration 80, loss = 0.0023
--- Epoch 370 / 1369 - 2003 epochs total
Iteration 0, loss = 0.0242
Iteration 20, loss = 0.0011
Iteration 40, loss = 0.0055
Iteration 60, loss = 0.0128
Iteration 80, loss = 0.0034
--- Epoch 371 / 1369 - 2004 epochs total
Iteration 0, loss = 0.0059
Iteration 20, loss = 0.0105
Iteration 40, loss = 0.0065
Iteration 60, loss = 0.0048
Iteration 80, loss = 0.0067
--- Epoch 372 / 1369 - 2005 epochs total
Iteration 0, loss = 0.0021
Iteration 20, loss = 0.0073
Iteration 40, loss = 0.0020
Iteration 60, loss = 0.0100
Iteration 80, loss = 0.0023
--- Epoch 373 / 1369 - 2006 epochs total
Iteration 0, loss = 0.0106
Iteration 20, loss = 0.0134
Iteration 40, loss = 0.0023
Iteration 60, loss = 0.0027
Iteration 80, loss = 0.0049
--- Epoch 374 / 1369 - 2007 epochs total
Iteration 0, loss = 0.0109
Iteration 20, loss = 0.0021
Iteration 40, loss = 0.0050
Iteration 60, loss = 0.0080
Iteration 80, loss = 0.0054
--- Epoch 375 / 1369 - 2008 epochs total
Iteration 0, loss = 0.0026
Iteration 20, loss = 0.0074
Iteration 40, loss = 0.0052
Iteration 60, loss = 0.0017
Iteration 80, loss = 0.0033
--- Epoch 376 / 1369 - 2009 epochs total
Iteration 0, loss = 0.0046
Iteration 20, loss = 0.0020
Iteration 40, loss = 0.0018
Iteration 60, loss = 0.0026
Iteration 80, loss = 0.0011
--- Epoch 377 / 1369 - 2010 epochs total
Iteration 0, loss = 0.0042
Iteration 20, loss = 0.0069
Iteration 40, loss = 0.0022
Iteration 60, loss = 0.0009
Iteration 80, loss = 0.0054
--- Epoch 378 / 1369 - 2011 epochs total
Iteration 0, loss = 0.0055
Iteration 20, loss = 0.0094
Iteration 40, loss = 0.0048
Iteration 60, loss = 0.0081
Iteration 80, loss = 0.0131
--- Epoch 379 / 1369 - 2012 epochs total
Iteration 0, loss = 0.0036
Iteration 20, loss = 0.0038
Iteration 40, loss = 0.0009
Iteration 60, loss = 0.0053
Iteration 80, loss = 0.0046
--- Epoch 380 / 1369 - 2013 epochs total
Iteration 0, loss = 0.0042
Iteration 20, loss = 0.0042
Iteration 40, loss = 0.0296
Iteration 60, loss = 0.0033
Iteration 80, loss = 0.0077
--- Epoch 381 / 1369 - 2014 epochs total
Iteration 0, loss = 0.0079
Iteration 20, loss = 0.0122
Iteration 40, loss = 0.0028
Iteration 60, loss = 0.0027
Iteration 80, loss = 0.0016
--- Epoch 382 / 1369 - 2015 epochs total
Iteration 0, loss = 0.0013
Iteration 20, loss = 0.0018
Iteration 40, loss = 0.0098
Iteration 60, loss = 0.0086
Iteration 80, loss = 0.0016
--- Epoch 383 / 1369 - 2016 epochs total
Iteration 0, loss = 0.0127
Iteration 20, loss = 0.0072
Iteration 40, loss = 0.0011
Iteration 60, loss = 0.0018
Iteration 80, loss = 0.0058
--- Epoch 384 / 1369 - 2017 epochs total
Iteration 0, loss = 0.0026
Iteration 20, loss = 0.0023
Iteration 40, loss = 0.0009
Iteration 60, loss = 0.0082
Iteration 80, loss = 0.0031
--- Epoch 385 / 1369 - 2018 epochs total
Iteration 0, loss = 0.0064
Iteration 20, loss = 0.0034
Iteration 40, loss = 0.0016
Iteration 60, loss = 0.0016
Iteration 80, loss = 0.0069
--- Epoch 386 / 1369 - 2019 epochs total
Iteration 0, loss = 0.0028
Iteration 20, loss = 0.0018
Iteration 40, loss = 0.0098
Iteration 60, loss = 0.0015
Iteration 80, loss = 0.0027
--- Epoch 387 / 1369 - 2020 epochs total
Iteration 0, loss = 0.0050
Iteration 20, loss = 0.0023
Iteration 40, loss = 0.0053
Iteration 60, loss = 0.0026
Iteration 80, loss = 0.0011
--- Epoch 388 / 1369 - 2021 epochs total
Iteration 0, loss = 0.0100
Iteration 20, loss = 0.0049
Iteration 40, loss = 0.0029
Iteration 60, loss = 0.0018
Iteration 80, loss = 0.0047
--- Epoch 389 / 1369 - 2022 epochs total
Iteration 0, loss = 0.0023
Iteration 20, loss = 0.0094
Iteration 40, loss = 0.0066
Iteration 60, loss = 0.0129
Iteration 80, loss = 0.0034
--- Epoch 390 / 1369 - 2023 epochs total
Iteration 0, loss = 0.0048
Iteration 20, loss = 0.0059
Iteration 40, loss = 0.0027
Iteration 60, loss = 0.0039
Iteration 80, loss = 0.0035
--- Epoch 391 / 1369 - 2024 epochs total
Iteration 0, loss = 0.0089
Iteration 20, loss = 0.0043
Iteration 40, loss = 0.0023
Iteration 60, loss = 0.0219
Iteration 80, loss = 0.0007
--- Epoch 392 / 1369 - 2025 epochs total
Iteration 0, loss = 0.0012
Iteration 20, loss = 0.0024
Iteration 40, loss = 0.0134
Iteration 60, loss = 0.0019
Iteration 80, loss = 0.0018
--- Epoch 393 / 1369 - 2026 epochs total
Iteration 0, loss = 0.0091
Iteration 20, loss = 0.0064
Iteration 40, loss = 0.0076
Iteration 60, loss = 0.0031
Iteration 80, loss = 0.0021
--- Epoch 394 / 1369 - 2027 epochs total
Iteration 0, loss = 0.0097
Iteration 20, loss = 0.0021
Iteration 40, loss = 0.0021
Iteration 60, loss = 0.0054
Iteration 80, loss = 0.0075
--- Epoch 395 / 1369 - 2028 epochs total
Iteration 0, loss = 0.0012
Iteration 20, loss = 0.0045
Iteration 40, loss = 0.0015
Iteration 60, loss = 0.0030
Iteration 80, loss = 0.0017
--- Epoch 396 / 1369 - 2029 epochs total
Iteration 0, loss = 0.0026
Iteration 20, loss = 0.0020
Iteration 40, loss = 0.0024
Iteration 60, loss = 0.0029
Iteration 80, loss = 0.0022
--- Epoch 397 / 1369 - 2030 epochs total
Iteration 0, loss = 0.0019
Iteration 20, loss = 0.0352
Iteration 40, loss = 0.0024
Iteration 60, loss = 0.0093
Iteration 80, loss = 0.0058
--- Epoch 398 / 1369 - 2031 epochs total
Iteration 0, loss = 0.0036
Iteration 20, loss = 0.0058
Iteration 40, loss = 0.0098
Iteration 60, loss = 0.0084
Iteration 80, loss = 0.0056
--- Epoch 399 / 1369 - 2032 epochs total
Iteration 0, loss = 0.0055
Iteration 20, loss = 0.0031
Iteration 40, loss = 0.0047
Iteration 60, loss = 0.0074
Iteration 80, loss = 0.0009
--- Epoch 400 / 1369 - 2033 epochs total
Iteration 0, loss = 0.0109
Iteration 20, loss = 0.0064
Iteration 40, loss = 0.0047
Iteration 60, loss = 0.0071
Iteration 80, loss = 0.0109
--- Epoch 401 / 1369 - 2034 epochs total
Iteration 0, loss = 0.0052
Iteration 20, loss = 0.0030
Iteration 40, loss = 0.0045
Iteration 60, loss = 0.0063
Iteration 80, loss = 0.0127
--- Epoch 402 / 1369 - 2035 epochs total
Iteration 0, loss = 0.0062
Iteration 20, loss = 0.0026
Iteration 40, loss = 0.0049
Iteration 60, loss = 0.0062
Iteration 80, loss = 0.0013
--- Epoch 403 / 1369 - 2036 epochs total
Iteration 0, loss = 0.0021
Iteration 20, loss = 0.0068
Iteration 40, loss = 0.0024
Iteration 60, loss = 0.0018
Iteration 80, loss = 0.0079
--- Epoch 404 / 1369 - 2037 epochs total
Iteration 0, loss = 0.0021
Iteration 20, loss = 0.0017
Iteration 40, loss = 0.0056
Iteration 60, loss = 0.0044
Iteration 80, loss = 0.0069
--- Epoch 405 / 1369 - 2038 epochs total
Iteration 0, loss = 0.0010
Iteration 20, loss = 0.0095
Iteration 40, loss = 0.0054
Iteration 60, loss = 0.0020
Iteration 80, loss = 0.0070
--- Epoch 406 / 1369 - 2039 epochs total
Iteration 0, loss = 0.0020
Iteration 20, loss = 0.0021
Iteration 40, loss = 0.0021
Iteration 60, loss = 0.0053
Iteration 80, loss = 0.0152
--- Epoch 407 / 1369 - 2040 epochs total
Iteration 0, loss = 0.0063
Iteration 20, loss = 0.0059
Iteration 40, loss = 0.0146
Iteration 60, loss = 0.0028
Iteration 80, loss = 0.0044
--- Epoch 408 / 1369 - 2041 epochs total
Iteration 0, loss = 0.0012
Iteration 20, loss = 0.0072
Iteration 40, loss = 0.0157
Iteration 60, loss = 0.0500
Iteration 80, loss = 0.0037
--- Epoch 409 / 1369 - 2042 epochs total
Iteration 0, loss = 0.0052
Iteration 20, loss = 0.0030
Iteration 40, loss = 0.0017
Iteration 60, loss = 0.0101
Iteration 80, loss = 0.0093
--- Epoch 410 / 1369 - 2043 epochs total
Iteration 0, loss = 0.0088
Iteration 20, loss = 0.0015
Iteration 40, loss = 0.0037
Iteration 60, loss = 0.0051
Iteration 80, loss = 0.0023
--- Epoch 411 / 1369 - 2044 epochs total
Iteration 0, loss = 0.0028
Iteration 20, loss = 0.0100
Iteration 40, loss = 0.0155
Iteration 60, loss = 0.0009
Iteration 80, loss = 0.0109
--- Epoch 412 / 1369 - 2045 epochs total
Iteration 0, loss = 0.0047
Iteration 20, loss = 0.0068
Iteration 40, loss = 0.0032
Iteration 60, loss = 0.0038
Iteration 80, loss = 0.0046
--- Epoch 413 / 1369 - 2046 epochs total
Iteration 0, loss = 0.0009
Iteration 20, loss = 0.0222
Iteration 40, loss = 0.0020
Iteration 60, loss = 0.0057
Iteration 80, loss = 0.0037
--- Epoch 414 / 1369 - 2047 epochs total
Iteration 0, loss = 0.0037
Iteration 20, loss = 0.0041
Iteration 40, loss = 0.0104
Iteration 60, loss = 0.0118
Iteration 80, loss = 0.0030
--- Epoch 415 / 1369 - 2048 epochs total
Iteration 0, loss = 0.0156
Iteration 20, loss = 0.0036
Iteration 40, loss = 0.0040
Iteration 60, loss = 0.0153
Iteration 80, loss = 0.0023
--- Epoch 416 / 1369 - 2049 epochs total
Iteration 0, loss = 0.0040
Iteration 20, loss = 0.0021
Iteration 40, loss = 0.0025
Iteration 60, loss = 0.0011
Iteration 80, loss = 0.0024
--- Epoch 417 / 1369 - 2050 epochs total
Iteration 0, loss = 0.0045
Iteration 20, loss = 0.0020
Iteration 40, loss = 0.0018
Iteration 60, loss = 0.0012
Iteration 80, loss = 0.0029
--- Epoch 418 / 1369 - 2051 epochs total
Iteration 0, loss = 0.0040
Iteration 20, loss = 0.0023
Iteration 40, loss = 0.0071
Iteration 60, loss = 0.0028
Iteration 80, loss = 0.0068
--- Epoch 419 / 1369 - 2052 epochs total
Iteration 0, loss = 0.0094
Iteration 20, loss = 0.0072
Iteration 40, loss = 0.0106
Iteration 60, loss = 0.0061
Iteration 80, loss = 0.0041
--- Epoch 420 / 1369 - 2053 epochs total
Iteration 0, loss = 0.0157
Iteration 20, loss = 0.0033
Iteration 40, loss = 0.0127
Iteration 60, loss = 0.0037
Iteration 80, loss = 0.0094
--- Epoch 421 / 1369 - 2054 epochs total
Iteration 0, loss = 0.0022
Iteration 20, loss = 0.0108
Iteration 40, loss = 0.0182
Iteration 60, loss = 0.0043
Iteration 80, loss = 0.0088
--- Epoch 422 / 1369 - 2055 epochs total
Iteration 0, loss = 0.0090
Iteration 20, loss = 0.0052
Iteration 40, loss = 0.0050
Iteration 60, loss = 0.0020
Iteration 80, loss = 0.0014
--- Epoch 423 / 1369 - 2056 epochs total
Iteration 0, loss = 0.0085
Iteration 20, loss = 0.0040
Iteration 40, loss = 0.0059
Iteration 60, loss = 0.0058
Iteration 80, loss = 0.0012
--- Epoch 424 / 1369 - 2057 epochs total
Iteration 0, loss = 0.0091
Iteration 20, loss = 0.0078
Iteration 40, loss = 0.0025
Iteration 60, loss = 0.0050
Iteration 80, loss = 0.0090
--- Epoch 425 / 1369 - 2058 epochs total
Iteration 0, loss = 0.0053
Iteration 20, loss = 0.0042
Iteration 40, loss = 0.0016
Iteration 60, loss = 0.0208
Iteration 80, loss = 0.0033
--- Epoch 426 / 1369 - 2059 epochs total
Iteration 0, loss = 0.0048
Iteration 20, loss = 0.0049
Iteration 40, loss = 0.0032
Iteration 60, loss = 0.0016
Iteration 80, loss = 0.0022
--- Epoch 427 / 1369 - 2060 epochs total
Iteration 0, loss = 0.0034
Iteration 20, loss = 0.0109
Iteration 40, loss = 0.0068
Iteration 60, loss = 0.0018
Iteration 80, loss = 0.0058
--- Epoch 428 / 1369 - 2061 epochs total
Iteration 0, loss = 0.0207
Iteration 20, loss = 0.0012
Iteration 40, loss = 0.0033
Iteration 60, loss = 0.0016
Iteration 80, loss = 0.0038
--- Epoch 429 / 1369 - 2062 epochs total
Iteration 0, loss = 0.0191
Iteration 20, loss = 0.0055
Iteration 40, loss = 0.0081
Iteration 60, loss = 0.0123
Iteration 80, loss = 0.0029
--- Epoch 430 / 1369 - 2063 epochs total
Iteration 0, loss = 0.0058
Iteration 20, loss = 0.0021
Iteration 40, loss = 0.0016
Iteration 60, loss = 0.0099
Iteration 80, loss = 0.0006
--- Epoch 431 / 1369 - 2064 epochs total
Iteration 0, loss = 0.0026
Iteration 20, loss = 0.0091
Iteration 40, loss = 0.0016
Iteration 60, loss = 0.0052
Iteration 80, loss = 0.0030
--- Epoch 432 / 1369 - 2065 epochs total
Iteration 0, loss = 0.0033
Iteration 20, loss = 0.0058
Iteration 40, loss = 0.0062
Iteration 60, loss = 0.0021
Iteration 80, loss = 0.0010
--- Epoch 433 / 1369 - 2066 epochs total
Iteration 0, loss = 0.0022
Iteration 20, loss = 0.0034
Iteration 40, loss = 0.0021
Iteration 60, loss = 0.0024
Iteration 80, loss = 0.0021
--- Epoch 434 / 1369 - 2067 epochs total
Iteration 0, loss = 0.0025
Iteration 20, loss = 0.0188
Iteration 40, loss = 0.0024
Iteration 60, loss = 0.0030
Iteration 80, loss = 0.0008
--- Epoch 435 / 1369 - 2068 epochs total
Iteration 0, loss = 0.0024
Iteration 20, loss = 0.0017
Iteration 40, loss = 0.0062
Iteration 60, loss = 0.0122
Iteration 80, loss = 0.0100
--- Epoch 436 / 1369 - 2069 epochs total
Iteration 0, loss = 0.0024
Iteration 20, loss = 0.0013
Iteration 40, loss = 0.0084
Iteration 60, loss = 0.0008
Iteration 80, loss = 0.0027
--- Epoch 437 / 1369 - 2070 epochs total
Iteration 0, loss = 0.0089
Iteration 20, loss = 0.0055
Iteration 40, loss = 0.0039
Iteration 60, loss = 0.0043
Iteration 80, loss = 0.0018
--- Epoch 438 / 1369 - 2071 epochs total
Iteration 0, loss = 0.0203
Iteration 20, loss = 0.0013
Iteration 40, loss = 0.0073
Iteration 60, loss = 0.0073
Iteration 80, loss = 0.0079
--- Epoch 439 / 1369 - 2072 epochs total
Iteration 0, loss = 0.0060
Iteration 20, loss = 0.0030
Iteration 40, loss = 0.0063
Iteration 60, loss = 0.0007
Iteration 80, loss = 0.0084
--- Epoch 440 / 1369 - 2073 epochs total
Iteration 0, loss = 0.0016
Iteration 20, loss = 0.0237
Iteration 40, loss = 0.0014
Iteration 60, loss = 0.0115
Iteration 80, loss = 0.0058
--- Epoch 441 / 1369 - 2074 epochs total
Iteration 0, loss = 0.0021
Iteration 20, loss = 0.0043
Iteration 40, loss = 0.0036
Iteration 60, loss = 0.0139
Iteration 80, loss = 0.0033
--- Epoch 442 / 1369 - 2075 epochs total
Iteration 0, loss = 0.0020
Iteration 20, loss = 0.0018
Iteration 40, loss = 0.0050
Iteration 60, loss = 0.0058
Iteration 80, loss = 0.0025
--- Epoch 443 / 1369 - 2076 epochs total
Iteration 0, loss = 0.0170
Iteration 20, loss = 0.0143
Iteration 40, loss = 0.0116
Iteration 60, loss = 0.0010
Iteration 80, loss = 0.0112
--- Epoch 444 / 1369 - 2077 epochs total
Iteration 0, loss = 0.0075
Iteration 20, loss = 0.0105
Iteration 40, loss = 0.0031
Iteration 60, loss = 0.0025
Iteration 80, loss = 0.0008
--- Epoch 445 / 1369 - 2078 epochs total
Iteration 0, loss = 0.0171
Iteration 20, loss = 0.0014
Iteration 40, loss = 0.0029
Iteration 60, loss = 0.0024
Iteration 80, loss = 0.0034
--- Epoch 446 / 1369 - 2079 epochs total
Iteration 0, loss = 0.0038
Iteration 20, loss = 0.0024
Iteration 40, loss = 0.0056
Iteration 60, loss = 0.0029
Iteration 80, loss = 0.0081
--- Epoch 447 / 1369 - 2080 epochs total
Iteration 0, loss = 0.0113
Iteration 20, loss = 0.0137
Iteration 40, loss = 0.0107
Iteration 60, loss = 0.0019
Iteration 80, loss = 0.0081
--- Epoch 448 / 1369 - 2081 epochs total
Iteration 0, loss = 0.0101
Iteration 20, loss = 0.0025
Iteration 40, loss = 0.0020
Iteration 60, loss = 0.0070
Iteration 80, loss = 0.0015
--- Epoch 449 / 1369 - 2082 epochs total
Iteration 0, loss = 0.0027
Iteration 20, loss = 0.0047
Iteration 40, loss = 0.0092
Iteration 60, loss = 0.0019
Iteration 80, loss = 0.0040
--- Epoch 450 / 1369 - 2083 epochs total
Iteration 0, loss = 0.0031
Iteration 20, loss = 0.0011
Iteration 40, loss = 0.0049
Iteration 60, loss = 0.0020
Iteration 80, loss = 0.0016
--- Epoch 451 / 1369 - 2084 epochs total
Iteration 0, loss = 0.0107
Iteration 20, loss = 0.0025
Iteration 40, loss = 0.0017
Iteration 60, loss = 0.0049
Iteration 80, loss = 0.0046
--- Epoch 452 / 1369 - 2085 epochs total
Iteration 0, loss = 0.0079
Iteration 20, loss = 0.0029
Iteration 40, loss = 0.0026
Iteration 60, loss = 0.0040
Iteration 80, loss = 0.0061
--- Epoch 453 / 1369 - 2086 epochs total
Iteration 0, loss = 0.0015
Iteration 20, loss = 0.0019
Iteration 40, loss = 0.0311
Iteration 60, loss = 0.0016
Iteration 80, loss = 0.0090
--- Epoch 454 / 1369 - 2087 epochs total
Iteration 0, loss = 0.0070
Iteration 20, loss = 0.0018
Iteration 40, loss = 0.0037
Iteration 60, loss = 0.0030
Iteration 80, loss = 0.0042
--- Epoch 455 / 1369 - 2088 epochs total
Iteration 0, loss = 0.0063
Iteration 20, loss = 0.0041
Iteration 40, loss = 0.0140
Iteration 60, loss = 0.0040
Iteration 80, loss = 0.0037
--- Epoch 456 / 1369 - 2089 epochs total
Iteration 0, loss = 0.0031
Iteration 20, loss = 0.0053
Iteration 40, loss = 0.0094
Iteration 60, loss = 0.0029
Iteration 80, loss = 0.0208
--- Epoch 457 / 1369 - 2090 epochs total
Iteration 0, loss = 0.0081
Iteration 20, loss = 0.0019
Iteration 40, loss = 0.0117
Iteration 60, loss = 0.0014
Iteration 80, loss = 0.0009
--- Epoch 458 / 1369 - 2091 epochs total
Iteration 0, loss = 0.0032
Iteration 20, loss = 0.0061
Iteration 40, loss = 0.0132
Iteration 60, loss = 0.0018
Iteration 80, loss = 0.0179
--- Epoch 459 / 1369 - 2092 epochs total
Iteration 0, loss = 0.0011
Iteration 20, loss = 0.0018
Iteration 40, loss = 0.0169
Iteration 60, loss = 0.0011
Iteration 80, loss = 0.0044
--- Epoch 460 / 1369 - 2093 epochs total
Iteration 0, loss = 0.0016
Iteration 20, loss = 0.0015
Iteration 40, loss = 0.0006
Iteration 60, loss = 0.0013
Iteration 80, loss = 0.0019
--- Epoch 461 / 1369 - 2094 epochs total
Iteration 0, loss = 0.0035
Iteration 20, loss = 0.0076
Iteration 40, loss = 0.0074
Iteration 60, loss = 0.0058
Iteration 80, loss = 0.0064
--- Epoch 462 / 1369 - 2095 epochs total
Iteration 0, loss = 0.0055
Iteration 20, loss = 0.0144
Iteration 40, loss = 0.0047
Iteration 60, loss = 0.0099
Iteration 80, loss = 0.0011
--- Epoch 463 / 1369 - 2096 epochs total
Iteration 0, loss = 0.0021
Iteration 20, loss = 0.0036
Iteration 40, loss = 0.0008
Iteration 60, loss = 0.0048
Iteration 80, loss = 0.0048
--- Epoch 464 / 1369 - 2097 epochs total
Iteration 0, loss = 0.0017
Iteration 20, loss = 0.0012
Iteration 40, loss = 0.0058
Iteration 60, loss = 0.0025
Iteration 80, loss = 0.0019
--- Epoch 465 / 1369 - 2098 epochs total
Iteration 0, loss = 0.0009
Iteration 20, loss = 0.0037
Iteration 40, loss = 0.0015
Iteration 60, loss = 0.0018
Iteration 80, loss = 0.0061
--- Epoch 466 / 1369 - 2099 epochs total
Iteration 0, loss = 0.0135
Iteration 20, loss = 0.0010
Iteration 40, loss = 0.0127
Iteration 60, loss = 0.0037
Iteration 80, loss = 0.0053
--- Epoch 467 / 1369 - 2100 epochs total
Iteration 0, loss = 0.0090
Iteration 20, loss = 0.0022
Iteration 40, loss = 0.0035
Iteration 60, loss = 0.0051
Iteration 80, loss = 0.0045
--- Epoch 468 / 1369 - 2101 epochs total
Iteration 0, loss = 0.0035
Iteration 20, loss = 0.0066
Iteration 40, loss = 0.0192
Iteration 60, loss = 0.0030
Iteration 80, loss = 0.0025
--- Epoch 469 / 1369 - 2102 epochs total
Iteration 0, loss = 0.0081
Iteration 20, loss = 0.0013
Iteration 40, loss = 0.0041
Iteration 60, loss = 0.0033
Iteration 80, loss = 0.0019
--- Epoch 470 / 1369 - 2103 epochs total
Iteration 0, loss = 0.0064
Iteration 20, loss = 0.0074
Iteration 40, loss = 0.0034
Iteration 60, loss = 0.0206
Iteration 80, loss = 0.0110
--- Epoch 471 / 1369 - 2104 epochs total
Iteration 0, loss = 0.0005
Iteration 20, loss = 0.0128
Iteration 40, loss = 0.0011
Iteration 60, loss = 0.0100
Iteration 80, loss = 0.0032
--- Epoch 472 / 1369 - 2105 epochs total
Iteration 0, loss = 0.0041
Iteration 20, loss = 0.0139
Iteration 40, loss = 0.0033
Iteration 60, loss = 0.0066
Iteration 80, loss = 0.0226
--- Epoch 473 / 1369 - 2106 epochs total
Iteration 0, loss = 0.0027
Iteration 20, loss = 0.0060
Iteration 40, loss = 0.0019
Iteration 60, loss = 0.0037
Iteration 80, loss = 0.0024
--- Epoch 474 / 1369 - 2107 epochs total
Iteration 0, loss = 0.0028
Iteration 20, loss = 0.0024
Iteration 40, loss = 0.0030
Iteration 60, loss = 0.0019
Iteration 80, loss = 0.0050
--- Epoch 475 / 1369 - 2108 epochs total
Iteration 0, loss = 0.0080
Iteration 20, loss = 0.0062
Iteration 40, loss = 0.0142
Iteration 60, loss = 0.0031
Iteration 80, loss = 0.0037
--- Epoch 476 / 1369 - 2109 epochs total
Iteration 0, loss = 0.0023
Iteration 20, loss = 0.0114
Iteration 40, loss = 0.0021
Iteration 60, loss = 0.0040
Iteration 80, loss = 0.0050
--- Epoch 477 / 1369 - 2110 epochs total
Iteration 0, loss = 0.0039
Iteration 20, loss = 0.0042
Iteration 40, loss = 0.0172
Iteration 60, loss = 0.0039
Iteration 80, loss = 0.0156
--- Epoch 478 / 1369 - 2111 epochs total
Iteration 0, loss = 0.0033
Iteration 20, loss = 0.0023
Iteration 40, loss = 0.0020
Iteration 60, loss = 0.0037
Iteration 80, loss = 0.0020
--- Epoch 479 / 1369 - 2112 epochs total
Iteration 0, loss = 0.0134
Iteration 20, loss = 0.0079
Iteration 40, loss = 0.0020
Iteration 60, loss = 0.0071
Iteration 80, loss = 0.0065
--- Epoch 480 / 1369 - 2113 epochs total
Iteration 0, loss = 0.0006
Iteration 20, loss = 0.0015
Iteration 40, loss = 0.0015
Iteration 60, loss = 0.0032
Iteration 80, loss = 0.0022
--- Epoch 481 / 1369 - 2114 epochs total
Iteration 0, loss = 0.0015
Iteration 20, loss = 0.0013
Iteration 40, loss = 0.0045
Iteration 60, loss = 0.0032
Iteration 80, loss = 0.0015
--- Epoch 482 / 1369 - 2115 epochs total
Iteration 0, loss = 0.0041
Iteration 20, loss = 0.0074
Iteration 40, loss = 0.0028
Iteration 60, loss = 0.0015
Iteration 80, loss = 0.0082
--- Epoch 483 / 1369 - 2116 epochs total
Iteration 0, loss = 0.0015
Iteration 20, loss = 0.0066
Iteration 40, loss = 0.0059
Iteration 60, loss = 0.0011
Iteration 80, loss = 0.0015
--- Epoch 484 / 1369 - 2117 epochs total
Iteration 0, loss = 0.0068
Iteration 20, loss = 0.0046
Iteration 40, loss = 0.0009
Iteration 60, loss = 0.0035
Iteration 80, loss = 0.0012
--- Epoch 485 / 1369 - 2118 epochs total
Iteration 0, loss = 0.0033
Iteration 20, loss = 0.0093
Iteration 40, loss = 0.0021
Iteration 60, loss = 0.0077
Iteration 80, loss = 0.0038
--- Epoch 486 / 1369 - 2119 epochs total
Iteration 0, loss = 0.0074
Iteration 20, loss = 0.0015
Iteration 40, loss = 0.0006
Iteration 60, loss = 0.0007
Iteration 80, loss = 0.0014
--- Epoch 487 / 1369 - 2120 epochs total
Iteration 0, loss = 0.0019
Iteration 20, loss = 0.0054
Iteration 40, loss = 0.0025
Iteration 60, loss = 0.0058
Iteration 80, loss = 0.0042
--- Epoch 488 / 1369 - 2121 epochs total
Iteration 0, loss = 0.0036
Iteration 20, loss = 0.0058
Iteration 40, loss = 0.0061
Iteration 60, loss = 0.0040
Iteration 80, loss = 0.0051
--- Epoch 489 / 1369 - 2122 epochs total
Iteration 0, loss = 0.0034
Iteration 20, loss = 0.0033
Iteration 40, loss = 0.0020
Iteration 60, loss = 0.0017
Iteration 80, loss = 0.0065
--- Epoch 490 / 1369 - 2123 epochs total
Iteration 0, loss = 0.0064
Iteration 20, loss = 0.0038
Iteration 40, loss = 0.0088
Iteration 60, loss = 0.0042
Iteration 80, loss = 0.0053
--- Epoch 491 / 1369 - 2124 epochs total
Iteration 0, loss = 0.0018
Iteration 20, loss = 0.0016
Iteration 40, loss = 0.0052
Iteration 60, loss = 0.0074
Iteration 80, loss = 0.0049
--- Epoch 492 / 1369 - 2125 epochs total
Iteration 0, loss = 0.0019
Iteration 20, loss = 0.0030
Iteration 40, loss = 0.0014
Iteration 60, loss = 0.0014
Iteration 80, loss = 0.0098
--- Epoch 493 / 1369 - 2126 epochs total
Iteration 0, loss = 0.0107
Iteration 20, loss = 0.0038
Iteration 40, loss = 0.0028
Iteration 60, loss = 0.0039
Iteration 80, loss = 0.0017
--- Epoch 494 / 1369 - 2127 epochs total
Iteration 0, loss = 0.0046
Iteration 20, loss = 0.0019
Iteration 40, loss = 0.0026
Iteration 60, loss = 0.0029
Iteration 80, loss = 0.0015
--- Epoch 495 / 1369 - 2128 epochs total
Iteration 0, loss = 0.0012
Iteration 20, loss = 0.0084
Iteration 40, loss = 0.0021
Iteration 60, loss = 0.0026
Iteration 80, loss = 0.0021
--- Epoch 496 / 1369 - 2129 epochs total
Iteration 0, loss = 0.0088
Iteration 20, loss = 0.0044
Iteration 40, loss = 0.0053
Iteration 60, loss = 0.0055
Iteration 80, loss = 0.0024
--- Epoch 497 / 1369 - 2130 epochs total
Iteration 0, loss = 0.0032
Iteration 20, loss = 0.0047
Iteration 40, loss = 0.0104
Iteration 60, loss = 0.0047
Iteration 80, loss = 0.0148
--- Epoch 498 / 1369 - 2131 epochs total
Iteration 0, loss = 0.0184
Iteration 20, loss = 0.0020
Iteration 40, loss = 0.0064
Iteration 60, loss = 0.0038
Iteration 80, loss = 0.0057
--- Epoch 499 / 1369 - 2132 epochs total
Iteration 0, loss = 0.0051
Iteration 20, loss = 0.0053
Iteration 40, loss = 0.0015
Iteration 60, loss = 0.0015
Iteration 80, loss = 0.0018
--- Epoch 500 / 1369 - 2133 epochs total
Iteration 0, loss = 0.0071
Iteration 20, loss = 0.0098
Iteration 40, loss = 0.0050
Iteration 60, loss = 0.0023
Iteration 80, loss = 0.0029
--- Epoch 501 / 1369 - 2134 epochs total
Iteration 0, loss = 0.0072
Iteration 20, loss = 0.0016
Iteration 40, loss = 0.0023
Iteration 60, loss = 0.0029
Iteration 80, loss = 0.0056
--- Epoch 502 / 1369 - 2135 epochs total
Iteration 0, loss = 0.0093
Iteration 20, loss = 0.0031
Iteration 40, loss = 0.0054
Iteration 60, loss = 0.0039
Iteration 80, loss = 0.0033
--- Epoch 503 / 1369 - 2136 epochs total
Iteration 0, loss = 0.0020
Iteration 20, loss = 0.0020
Iteration 40, loss = 0.0031
Iteration 60, loss = 0.0045
Iteration 80, loss = 0.0038
--- Epoch 504 / 1369 - 2137 epochs total
Iteration 0, loss = 0.0042
Iteration 20, loss = 0.0012
Iteration 40, loss = 0.0060
Iteration 60, loss = 0.0037
Iteration 80, loss = 0.0073
--- Epoch 505 / 1369 - 2138 epochs total
Iteration 0, loss = 0.0019
Iteration 20, loss = 0.0046
Iteration 40, loss = 0.0012
Iteration 60, loss = 0.0023
Iteration 80, loss = 0.0021
--- Epoch 506 / 1369 - 2139 epochs total
Iteration 0, loss = 0.0081
Iteration 20, loss = 0.0067
Iteration 40, loss = 0.0023
Iteration 60, loss = 0.0021
Iteration 80, loss = 0.0031
--- Epoch 507 / 1369 - 2140 epochs total
Iteration 0, loss = 0.0039
Iteration 20, loss = 0.0071
Iteration 40, loss = 0.0011
Iteration 60, loss = 0.0024
Iteration 80, loss = 0.0046
--- Epoch 508 / 1369 - 2141 epochs total
Iteration 0, loss = 0.0058
Iteration 20, loss = 0.0068
Iteration 40, loss = 0.0114
Iteration 60, loss = 0.0049
Iteration 80, loss = 0.0055
--- Epoch 509 / 1369 - 2142 epochs total
Iteration 0, loss = 0.0059
Iteration 20, loss = 0.0050
Iteration 40, loss = 0.0029
Iteration 60, loss = 0.0021
Iteration 80, loss = 0.0088
--- Epoch 510 / 1369 - 2143 epochs total
Iteration 0, loss = 0.0014
Iteration 20, loss = 0.0041
Iteration 40, loss = 0.0032
Iteration 60, loss = 0.0043
Iteration 80, loss = 0.0148
--- Epoch 511 / 1369 - 2144 epochs total
Iteration 0, loss = 0.0067
Iteration 20, loss = 0.0009
Iteration 40, loss = 0.0127
Iteration 60, loss = 0.0030
Iteration 80, loss = 0.0039
--- Epoch 512 / 1369 - 2145 epochs total
Iteration 0, loss = 0.0064
Iteration 20, loss = 0.0122
Iteration 40, loss = 0.0040
Iteration 60, loss = 0.0178
Iteration 80, loss = 0.0031
--- Epoch 513 / 1369 - 2146 epochs total
Iteration 0, loss = 0.0091
Iteration 20, loss = 0.0226
Iteration 40, loss = 0.0029
Iteration 60, loss = 0.0058
Iteration 80, loss = 0.0036
--- Epoch 514 / 1369 - 2147 epochs total
Iteration 0, loss = 0.0025
Iteration 20, loss = 0.0052
Iteration 40, loss = 0.0034
Iteration 60, loss = 0.0057
Iteration 80, loss = 0.0068
--- Epoch 515 / 1369 - 2148 epochs total
Iteration 0, loss = 0.0125
Iteration 20, loss = 0.0024
Iteration 40, loss = 0.0031
Iteration 60, loss = 0.0052
Iteration 80, loss = 0.0048
--- Epoch 516 / 1369 - 2149 epochs total
Iteration 0, loss = 0.0020
Iteration 20, loss = 0.0010
Iteration 40, loss = 0.0045
Iteration 60, loss = 0.0015
Iteration 80, loss = 0.0017
--- Epoch 517 / 1369 - 2150 epochs total
Iteration 0, loss = 0.0015
Iteration 20, loss = 0.0015
Iteration 40, loss = 0.0028
Iteration 60, loss = 0.0021
Iteration 80, loss = 0.0025
--- Epoch 518 / 1369 - 2151 epochs total
Iteration 0, loss = 0.0024
Iteration 20, loss = 0.0023
Iteration 40, loss = 0.0035
Iteration 60, loss = 0.0032
Iteration 80, loss = 0.0047
--- Epoch 519 / 1369 - 2152 epochs total
Iteration 0, loss = 0.0139
Iteration 20, loss = 0.0044
Iteration 40, loss = 0.0025
Iteration 60, loss = 0.0018
Iteration 80, loss = 0.0036
--- Epoch 520 / 1369 - 2153 epochs total
Iteration 0, loss = 0.0007
Iteration 20, loss = 0.0118
Iteration 40, loss = 0.0094
Iteration 60, loss = 0.0034
Iteration 80, loss = 0.0116
--- Epoch 521 / 1369 - 2154 epochs total
Iteration 0, loss = 0.0075
Iteration 20, loss = 0.0101
Iteration 40, loss = 0.0037
Iteration 60, loss = 0.0049
Iteration 80, loss = 0.0118
--- Epoch 522 / 1369 - 2155 epochs total
Iteration 0, loss = 0.0024
Iteration 20, loss = 0.0041
Iteration 40, loss = 0.0043
Iteration 60, loss = 0.0049
Iteration 80, loss = 0.0035
--- Epoch 523 / 1369 - 2156 epochs total
Iteration 0, loss = 0.0056
Iteration 20, loss = 0.0094
Iteration 40, loss = 0.0051
Iteration 60, loss = 0.0064
Iteration 80, loss = 0.0045
--- Epoch 524 / 1369 - 2157 epochs total
Iteration 0, loss = 0.0019
Iteration 20, loss = 0.0091
Iteration 40, loss = 0.0017
Iteration 60, loss = 0.0015
Iteration 80, loss = 0.0019
--- Epoch 525 / 1369 - 2158 epochs total
Iteration 0, loss = 0.0012
Iteration 20, loss = 0.0011
Iteration 40, loss = 0.0076
Iteration 60, loss = 0.0022
Iteration 80, loss = 0.0036
--- Epoch 526 / 1369 - 2159 epochs total
Iteration 0, loss = 0.0021
Iteration 20, loss = 0.0053
Iteration 40, loss = 0.0100
Iteration 60, loss = 0.0013
Iteration 80, loss = 0.0035
--- Epoch 527 / 1369 - 2160 epochs total
Iteration 0, loss = 0.0088
Iteration 20, loss = 0.0092
Iteration 40, loss = 0.0022
Iteration 60, loss = 0.0026
Iteration 80, loss = 0.0084
--- Epoch 528 / 1369 - 2161 epochs total
Iteration 0, loss = 0.0058
Iteration 20, loss = 0.0026
Iteration 40, loss = 0.0100
Iteration 60, loss = 0.0019
Iteration 80, loss = 0.0011
--- Epoch 529 / 1369 - 2162 epochs total
Iteration 0, loss = 0.0112
Iteration 20, loss = 0.0048
Iteration 40, loss = 0.0080
Iteration 60, loss = 0.0065
Iteration 80, loss = 0.0058
--- Epoch 530 / 1369 - 2163 epochs total
Iteration 0, loss = 0.0047
Iteration 20, loss = 0.0039
Iteration 40, loss = 0.0075
Iteration 60, loss = 0.0016
Iteration 80, loss = 0.0012
--- Epoch 531 / 1369 - 2164 epochs total
Iteration 0, loss = 0.0058
Iteration 20, loss = 0.0171
Iteration 40, loss = 0.0029
Iteration 60, loss = 0.0018
Iteration 80, loss = 0.0048
--- Epoch 532 / 1369 - 2165 epochs total
Iteration 0, loss = 0.0352
Iteration 20, loss = 0.0025
Iteration 40, loss = 0.0016
Iteration 60, loss = 0.0051
Iteration 80, loss = 0.0029
--- Epoch 533 / 1369 - 2166 epochs total
Iteration 0, loss = 0.0215
Iteration 20, loss = 0.0032
Iteration 40, loss = 0.0080
Iteration 60, loss = 0.0050
Iteration 80, loss = 0.0036
--- Epoch 534 / 1369 - 2167 epochs total
Iteration 0, loss = 0.0039
Iteration 20, loss = 0.0035
Iteration 40, loss = 0.0030
Iteration 60, loss = 0.0052
Iteration 80, loss = 0.0025
--- Epoch 535 / 1369 - 2168 epochs total
Iteration 0, loss = 0.0019
Iteration 20, loss = 0.0039
Iteration 40, loss = 0.0065
Iteration 60, loss = 0.0045
Iteration 80, loss = 0.0081
--- Epoch 536 / 1369 - 2169 epochs total
Iteration 0, loss = 0.0053
Iteration 20, loss = 0.0021
Iteration 40, loss = 0.0015
Iteration 60, loss = 0.0020
Iteration 80, loss = 0.0016
--- Epoch 537 / 1369 - 2170 epochs total
Iteration 0, loss = 0.0024
Iteration 20, loss = 0.0096
Iteration 40, loss = 0.0053
Iteration 60, loss = 0.0038
Iteration 80, loss = 0.0048
--- Epoch 538 / 1369 - 2171 epochs total
Iteration 0, loss = 0.0021
Iteration 20, loss = 0.0021
Iteration 40, loss = 0.0027
Iteration 60, loss = 0.0032
Iteration 80, loss = 0.0127
--- Epoch 539 / 1369 - 2172 epochs total
Iteration 0, loss = 0.0081
Iteration 20, loss = 0.0016
Iteration 40, loss = 0.0013
Iteration 60, loss = 0.0021
Iteration 80, loss = 0.0054
--- Epoch 540 / 1369 - 2173 epochs total
Iteration 0, loss = 0.0022
Iteration 20, loss = 0.0040
Iteration 40, loss = 0.0091
Iteration 60, loss = 0.0037
Iteration 80, loss = 0.0009
--- Epoch 541 / 1369 - 2174 epochs total
Iteration 0, loss = 0.0019
Iteration 20, loss = 0.0027
Iteration 40, loss = 0.0030
Iteration 60, loss = 0.0047
Iteration 80, loss = 0.0041
--- Epoch 542 / 1369 - 2175 epochs total
Iteration 0, loss = 0.0192
Iteration 20, loss = 0.0037
Iteration 40, loss = 0.0080
Iteration 60, loss = 0.0007
Iteration 80, loss = 0.0026
--- Epoch 543 / 1369 - 2176 epochs total
Iteration 0, loss = 0.0028
Iteration 20, loss = 0.0092
Iteration 40, loss = 0.0038
Iteration 60, loss = 0.0073
Iteration 80, loss = 0.0071
--- Epoch 544 / 1369 - 2177 epochs total
Iteration 0, loss = 0.0029
Iteration 20, loss = 0.0064
Iteration 40, loss = 0.0059
Iteration 60, loss = 0.0032
Iteration 80, loss = 0.0006
--- Epoch 545 / 1369 - 2178 epochs total
Iteration 0, loss = 0.0051
Iteration 20, loss = 0.0032
Iteration 40, loss = 0.0034
Iteration 60, loss = 0.0060
Iteration 80, loss = 0.0053
--- Epoch 546 / 1369 - 2179 epochs total
Iteration 0, loss = 0.0012
Iteration 20, loss = 0.0076
Iteration 40, loss = 0.0024
Iteration 60, loss = 0.0090
Iteration 80, loss = 0.0130
--- Epoch 547 / 1369 - 2180 epochs total
Iteration 0, loss = 0.0075
Iteration 20, loss = 0.0077
Iteration 40, loss = 0.0044
Iteration 60, loss = 0.0050
Iteration 80, loss = 0.0046
--- Epoch 548 / 1369 - 2181 epochs total
Iteration 0, loss = 0.0013
Iteration 20, loss = 0.0021
Iteration 40, loss = 0.0021
Iteration 60, loss = 0.0310
Iteration 80, loss = 0.0043
--- Epoch 549 / 1369 - 2182 epochs total
Iteration 0, loss = 0.0026
Iteration 20, loss = 0.0010
Iteration 40, loss = 0.0048
Iteration 60, loss = 0.0068
Iteration 80, loss = 0.0031
--- Epoch 550 / 1369 - 2183 epochs total
Iteration 0, loss = 0.0027
Iteration 20, loss = 0.0059
Iteration 40, loss = 0.0063
Iteration 60, loss = 0.0028
Iteration 80, loss = 0.0005
--- Epoch 551 / 1369 - 2184 epochs total
Iteration 0, loss = 0.0020
Iteration 20, loss = 0.0023
Iteration 40, loss = 0.0042
Iteration 60, loss = 0.0027
Iteration 80, loss = 0.0021
--- Epoch 552 / 1369 - 2185 epochs total
Iteration 0, loss = 0.0065
Iteration 20, loss = 0.0007
Iteration 40, loss = 0.0024
Iteration 60, loss = 0.0043
Iteration 80, loss = 0.0024
--- Epoch 553 / 1369 - 2186 epochs total
Iteration 0, loss = 0.0011
Iteration 20, loss = 0.0066
Iteration 40, loss = 0.0050
Iteration 60, loss = 0.0025
Iteration 80, loss = 0.0043
--- Epoch 554 / 1369 - 2187 epochs total
Iteration 0, loss = 0.0043
Iteration 20, loss = 0.0011
Iteration 40, loss = 0.0060
Iteration 60, loss = 0.0017
Iteration 80, loss = 0.0017
--- Epoch 555 / 1369 - 2188 epochs total
Iteration 0, loss = 0.0013
Iteration 20, loss = 0.0028
Iteration 40, loss = 0.0094
Iteration 60, loss = 0.0025
Iteration 80, loss = 0.0083
--- Epoch 556 / 1369 - 2189 epochs total
Iteration 0, loss = 0.0063
Iteration 20, loss = 0.0051
Iteration 40, loss = 0.0024
Iteration 60, loss = 0.0032
Iteration 80, loss = 0.0018
--- Epoch 557 / 1369 - 2190 epochs total
Iteration 0, loss = 0.0012
Iteration 20, loss = 0.0030
Iteration 40, loss = 0.0027
Iteration 60, loss = 0.0027
Iteration 80, loss = 0.0021
--- Epoch 558 / 1369 - 2191 epochs total
Iteration 0, loss = 0.0065
Iteration 20, loss = 0.0090
Iteration 40, loss = 0.0029
Iteration 60, loss = 0.0028
Iteration 80, loss = 0.0057
--- Epoch 559 / 1369 - 2192 epochs total
Iteration 0, loss = 0.0042
Iteration 20, loss = 0.0064
Iteration 40, loss = 0.0144
Iteration 60, loss = 0.0019
Iteration 80, loss = 0.0139
--- Epoch 560 / 1369 - 2193 epochs total
Iteration 0, loss = 0.0036
Iteration 20, loss = 0.0041
Iteration 40, loss = 0.0103
Iteration 60, loss = 0.0033
Iteration 80, loss = 0.0011
--- Epoch 561 / 1369 - 2194 epochs total
Iteration 0, loss = 0.0059
Iteration 20, loss = 0.0031
Iteration 40, loss = 0.0185
Iteration 60, loss = 0.0029
Iteration 80, loss = 0.0045
--- Epoch 562 / 1369 - 2195 epochs total
Iteration 0, loss = 0.0242
Iteration 20, loss = 0.0029
Iteration 40, loss = 0.0108
Iteration 60, loss = 0.0028
Iteration 80, loss = 0.0122
--- Epoch 563 / 1369 - 2196 epochs total
Iteration 0, loss = 0.0083
Iteration 20, loss = 0.0310
Iteration 40, loss = 0.0028
Iteration 60, loss = 0.0008
Iteration 80, loss = 0.0019
--- Epoch 564 / 1369 - 2197 epochs total
Iteration 0, loss = 0.0078
Iteration 20, loss = 0.0023
Iteration 40, loss = 0.0079
Iteration 60, loss = 0.0013
Iteration 80, loss = 0.0049
--- Epoch 565 / 1369 - 2198 epochs total
Iteration 0, loss = 0.0028
Iteration 20, loss = 0.0058
Iteration 40, loss = 0.0043
Iteration 60, loss = 0.0020
Iteration 80, loss = 0.0023
--- Epoch 566 / 1369 - 2199 epochs total
Iteration 0, loss = 0.0058
Iteration 20, loss = 0.0050
Iteration 40, loss = 0.0027
Iteration 60, loss = 0.0038
Iteration 80, loss = 0.0019
--- Epoch 567 / 1369 - 2200 epochs total
Iteration 0, loss = 0.0010
Iteration 20, loss = 0.0050
Iteration 40, loss = 0.0059
Iteration 60, loss = 0.0049
Iteration 80, loss = 0.0113
--- Epoch 568 / 1369 - 2201 epochs total
Iteration 0, loss = 0.0142
Iteration 20, loss = 0.0023
Iteration 40, loss = 0.0050
Iteration 60, loss = 0.0156
Iteration 80, loss = 0.0030
--- Epoch 569 / 1369 - 2202 epochs total
Iteration 0, loss = 0.0007
Iteration 20, loss = 0.0040
Iteration 40, loss = 0.0059
Iteration 60, loss = 0.0121
Iteration 80, loss = 0.0414
--- Epoch 570 / 1369 - 2203 epochs total
Iteration 0, loss = 0.0033
Iteration 20, loss = 0.0107
Iteration 40, loss = 0.0061
Iteration 60, loss = 0.0131
Iteration 80, loss = 0.0073
--- Epoch 571 / 1369 - 2204 epochs total
Iteration 0, loss = 0.0066
Iteration 20, loss = 0.0014
Iteration 40, loss = 0.0149
Iteration 60, loss = 0.0027
Iteration 80, loss = 0.0151
--- Epoch 572 / 1369 - 2205 epochs total
Iteration 0, loss = 0.0056
Iteration 20, loss = 0.0067
Iteration 40, loss = 0.0046
Iteration 60, loss = 0.0098
Iteration 80, loss = 0.0029
--- Epoch 573 / 1369 - 2206 epochs total
Iteration 0, loss = 0.0024
Iteration 20, loss = 0.0039
Iteration 40, loss = 0.0027
Iteration 60, loss = 0.0035
Iteration 80, loss = 0.0172
--- Epoch 574 / 1369 - 2207 epochs total
Iteration 0, loss = 0.0051
Iteration 20, loss = 0.0009
Iteration 40, loss = 0.0028
Iteration 60, loss = 0.0014
Iteration 80, loss = 0.0021
--- Epoch 575 / 1369 - 2208 epochs total
Iteration 0, loss = 0.0107
Iteration 20, loss = 0.0101
Iteration 40, loss = 0.0083
Iteration 60, loss = 0.0013
Iteration 80, loss = 0.0081
--- Epoch 576 / 1369 - 2209 epochs total
Iteration 0, loss = 0.0031
Iteration 20, loss = 0.0084
Iteration 40, loss = 0.0082
Iteration 60, loss = 0.0019
Iteration 80, loss = 0.0018
--- Epoch 577 / 1369 - 2210 epochs total
Iteration 0, loss = 0.0047
Iteration 20, loss = 0.0053
Iteration 40, loss = 0.0023
Iteration 60, loss = 0.0033
Iteration 80, loss = 0.0027
--- Epoch 578 / 1369 - 2211 epochs total
Iteration 0, loss = 0.0098
Iteration 20, loss = 0.0033
Iteration 40, loss = 0.0052
Iteration 60, loss = 0.0046
Iteration 80, loss = 0.0022
--- Epoch 579 / 1369 - 2212 epochs total
Iteration 0, loss = 0.0028
Iteration 20, loss = 0.0049
Iteration 40, loss = 0.0074
Iteration 60, loss = 0.0034
Iteration 80, loss = 0.0030
--- Epoch 580 / 1369 - 2213 epochs total
Iteration 0, loss = 0.0038
Iteration 20, loss = 0.0047
Iteration 40, loss = 0.0049
Iteration 60, loss = 0.0058
Iteration 80, loss = 0.0062
--- Epoch 581 / 1369 - 2214 epochs total
Iteration 0, loss = 0.0053
Iteration 20, loss = 0.0048
Iteration 40, loss = 0.0033
Iteration 60, loss = 0.0034
Iteration 80, loss = 0.0029
--- Epoch 582 / 1369 - 2215 epochs total
Iteration 0, loss = 0.0114
Iteration 20, loss = 0.0020
Iteration 40, loss = 0.0011
Iteration 60, loss = 0.0282
Iteration 80, loss = 0.0055
--- Epoch 583 / 1369 - 2216 epochs total
Iteration 0, loss = 0.0071
Iteration 20, loss = 0.0019
Iteration 40, loss = 0.0011
Iteration 60, loss = 0.0074
Iteration 80, loss = 0.0314
--- Epoch 584 / 1369 - 2217 epochs total
Iteration 0, loss = 0.0078
Iteration 20, loss = 0.0032
Iteration 40, loss = 0.0017
Iteration 60, loss = 0.0030
Iteration 80, loss = 0.0016
--- Epoch 585 / 1369 - 2218 epochs total
Iteration 0, loss = 0.0013
Iteration 20, loss = 0.0022
Iteration 40, loss = 0.0025
Iteration 60, loss = 0.0018
Iteration 80, loss = 0.0038
--- Epoch 586 / 1369 - 2219 epochs total
Iteration 0, loss = 0.0055
Iteration 20, loss = 0.0072
Iteration 40, loss = 0.0101
Iteration 60, loss = 0.0018
Iteration 80, loss = 0.0030
--- Epoch 587 / 1369 - 2220 epochs total
Iteration 0, loss = 0.0008
Iteration 20, loss = 0.0124
Iteration 40, loss = 0.0032
Iteration 60, loss = 0.0007
Iteration 80, loss = 0.0010
--- Epoch 588 / 1369 - 2221 epochs total
Iteration 0, loss = 0.0029
Iteration 20, loss = 0.0050
Iteration 40, loss = 0.0023
Iteration 60, loss = 0.0014
Iteration 80, loss = 0.0048
--- Epoch 589 / 1369 - 2222 epochs total
Iteration 0, loss = 0.0036
Iteration 20, loss = 0.0056
Iteration 40, loss = 0.0041
Iteration 60, loss = 0.0020
Iteration 80, loss = 0.0015
--- Epoch 590 / 1369 - 2223 epochs total
Iteration 0, loss = 0.0091
Iteration 20, loss = 0.0019
Iteration 40, loss = 0.0007
Iteration 60, loss = 0.0123
Iteration 80, loss = 0.0040
--- Epoch 591 / 1369 - 2224 epochs total
Iteration 0, loss = 0.0030
Iteration 20, loss = 0.0014
Iteration 40, loss = 0.0034
Iteration 60, loss = 0.0051
Iteration 80, loss = 0.0021
--- Epoch 592 / 1369 - 2225 epochs total
Iteration 0, loss = 0.0110
Iteration 20, loss = 0.0017
Iteration 40, loss = 0.0093
Iteration 60, loss = 0.0027
Iteration 80, loss = 0.0086
--- Epoch 593 / 1369 - 2226 epochs total
Iteration 0, loss = 0.0050
Iteration 20, loss = 0.0044
Iteration 40, loss = 0.0020
Iteration 60, loss = 0.0036
Iteration 80, loss = 0.0032
--- Epoch 594 / 1369 - 2227 epochs total
Iteration 0, loss = 0.0031
Iteration 20, loss = 0.0029
Iteration 40, loss = 0.0013
Iteration 60, loss = 0.0046
Iteration 80, loss = 0.0022
--- Epoch 595 / 1369 - 2228 epochs total
Iteration 0, loss = 0.0104
Iteration 20, loss = 0.0024
Iteration 40, loss = 0.0040
Iteration 60, loss = 0.0058
Iteration 80, loss = 0.0132
--- Epoch 596 / 1369 - 2229 epochs total
Iteration 0, loss = 0.0094
Iteration 20, loss = 0.0181
Iteration 40, loss = 0.0014
Iteration 60, loss = 0.0113
Iteration 80, loss = 0.0085
--- Epoch 597 / 1369 - 2230 epochs total
Iteration 0, loss = 0.0057
Iteration 20, loss = 0.0108
Iteration 40, loss = 0.0061
Iteration 60, loss = 0.0024
Iteration 80, loss = 0.0091
--- Epoch 598 / 1369 - 2231 epochs total
Iteration 0, loss = 0.0029
Iteration 20, loss = 0.0088
Iteration 40, loss = 0.0059
Iteration 60, loss = 0.0029
Iteration 80, loss = 0.0015
--- Epoch 599 / 1369 - 2232 epochs total
Iteration 0, loss = 0.0023
Iteration 20, loss = 0.0074
Iteration 40, loss = 0.0033
Iteration 60, loss = 0.0017
Iteration 80, loss = 0.0127
--- Epoch 600 / 1369 - 2233 epochs total
Iteration 0, loss = 0.0043
Iteration 20, loss = 0.0065
Iteration 40, loss = 0.0014
Iteration 60, loss = 0.0105
Iteration 80, loss = 0.0118
--- Epoch 601 / 1369 - 2234 epochs total
Iteration 0, loss = 0.0020
Iteration 20, loss = 0.0013
Iteration 40, loss = 0.0039
Iteration 60, loss = 0.0047
Iteration 80, loss = 0.0029
--- Epoch 602 / 1369 - 2235 epochs total
Iteration 0, loss = 0.0035
Iteration 20, loss = 0.0038
Iteration 40, loss = 0.0059
Iteration 60, loss = 0.0038
Iteration 80, loss = 0.0023
--- Epoch 603 / 1369 - 2236 epochs total
Iteration 0, loss = 0.0103
Iteration 20, loss = 0.0146
Iteration 40, loss = 0.0037
Iteration 60, loss = 0.0075
Iteration 80, loss = 0.0013
--- Epoch 604 / 1369 - 2237 epochs total
Iteration 0, loss = 0.0025
Iteration 20, loss = 0.0039
Iteration 40, loss = 0.0012
Iteration 60, loss = 0.0089
Iteration 80, loss = 0.0033
--- Epoch 605 / 1369 - 2238 epochs total
Iteration 0, loss = 0.0087
Iteration 20, loss = 0.0047
Iteration 40, loss = 0.0085
Iteration 60, loss = 0.0096
Iteration 80, loss = 0.0033
--- Epoch 606 / 1369 - 2239 epochs total
Iteration 0, loss = 0.0131
Iteration 20, loss = 0.0093
Iteration 40, loss = 0.0014
Iteration 60, loss = 0.0035
Iteration 80, loss = 0.0017
--- Epoch 607 / 1369 - 2240 epochs total
Iteration 0, loss = 0.0065
Iteration 20, loss = 0.0027
Iteration 40, loss = 0.0033
Iteration 60, loss = 0.0111
Iteration 80, loss = 0.0023
--- Epoch 608 / 1369 - 2241 epochs total
Iteration 0, loss = 0.0042
Iteration 20, loss = 0.0034
Iteration 40, loss = 0.0072
Iteration 60, loss = 0.0023
Iteration 80, loss = 0.0015
--- Epoch 609 / 1369 - 2242 epochs total
Iteration 0, loss = 0.0097
Iteration 20, loss = 0.0090
Iteration 40, loss = 0.0012
Iteration 60, loss = 0.0079
Iteration 80, loss = 0.0053
--- Epoch 610 / 1369 - 2243 epochs total
Iteration 0, loss = 0.0038
Iteration 20, loss = 0.0125
Iteration 40, loss = 0.0025
Iteration 60, loss = 0.0030
Iteration 80, loss = 0.0030
--- Epoch 611 / 1369 - 2244 epochs total
Iteration 0, loss = 0.0016
Iteration 20, loss = 0.0081
Iteration 40, loss = 0.0079
Iteration 60, loss = 0.0300
Iteration 80, loss = 0.0074
--- Epoch 612 / 1369 - 2245 epochs total
Iteration 0, loss = 0.0087
Iteration 20, loss = 0.0022
Iteration 40, loss = 0.0083
Iteration 60, loss = 0.0058
Iteration 80, loss = 0.0033
--- Epoch 613 / 1369 - 2246 epochs total
Iteration 0, loss = 0.0043
Iteration 20, loss = 0.0021
Iteration 40, loss = 0.0034
Iteration 60, loss = 0.0062
Iteration 80, loss = 0.0012
--- Epoch 614 / 1369 - 2247 epochs total
Iteration 0, loss = 0.0059
Iteration 20, loss = 0.0080
Iteration 40, loss = 0.0209
Iteration 60, loss = 0.0070
Iteration 80, loss = 0.0009
--- Epoch 615 / 1369 - 2248 epochs total
Iteration 0, loss = 0.0029
Iteration 20, loss = 0.0164
Iteration 40, loss = 0.0057
Iteration 60, loss = 0.0045
Iteration 80, loss = 0.0040
--- Epoch 616 / 1369 - 2249 epochs total
Iteration 0, loss = 0.0095
Iteration 20, loss = 0.0025
Iteration 40, loss = 0.0034
Iteration 60, loss = 0.0036
Iteration 80, loss = 0.0030
--- Epoch 617 / 1369 - 2250 epochs total
Iteration 0, loss = 0.0075
Iteration 20, loss = 0.0022
Iteration 40, loss = 0.0020
Iteration 60, loss = 0.0016
Iteration 80, loss = 0.0014
--- Epoch 618 / 1369 - 2251 epochs total
Iteration 0, loss = 0.0048
Iteration 20, loss = 0.0051
Iteration 40, loss = 0.0061
Iteration 60, loss = 0.0027
Iteration 80, loss = 0.0050
--- Epoch 619 / 1369 - 2252 epochs total
Iteration 0, loss = 0.0071
Iteration 20, loss = 0.0018
Iteration 40, loss = 0.0057
Iteration 60, loss = 0.0025
Iteration 80, loss = 0.0041
--- Epoch 620 / 1369 - 2253 epochs total
Iteration 0, loss = 0.0017
Iteration 20, loss = 0.0012
Iteration 40, loss = 0.0093
Iteration 60, loss = 0.0051
Iteration 80, loss = 0.0015
--- Epoch 621 / 1369 - 2254 epochs total
Iteration 0, loss = 0.0070
Iteration 20, loss = 0.0068
Iteration 40, loss = 0.0046
Iteration 60, loss = 0.0019
Iteration 80, loss = 0.0040
--- Epoch 622 / 1369 - 2255 epochs total
Iteration 0, loss = 0.0015
Iteration 20, loss = 0.0088
Iteration 40, loss = 0.0037
Iteration 60, loss = 0.0035
Iteration 80, loss = 0.0022
--- Epoch 623 / 1369 - 2256 epochs total
Iteration 0, loss = 0.0013
Iteration 20, loss = 0.0015
Iteration 40, loss = 0.0020
Iteration 60, loss = 0.0014
Iteration 80, loss = 0.0053
--- Epoch 624 / 1369 - 2257 epochs total
Iteration 0, loss = 0.0023
Iteration 20, loss = 0.0015
Iteration 40, loss = 0.0068
Iteration 60, loss = 0.0166
Iteration 80, loss = 0.0029
--- Epoch 625 / 1369 - 2258 epochs total
Iteration 0, loss = 0.0029
Iteration 20, loss = 0.0034
Iteration 40, loss = 0.0054
Iteration 60, loss = 0.0174
Iteration 80, loss = 0.0038
--- Epoch 626 / 1369 - 2259 epochs total
Iteration 0, loss = 0.0022
Iteration 20, loss = 0.0015
Iteration 40, loss = 0.0084
Iteration 60, loss = 0.0103
Iteration 80, loss = 0.0030
--- Epoch 627 / 1369 - 2260 epochs total
Iteration 0, loss = 0.0250
Iteration 20, loss = 0.0009
Iteration 40, loss = 0.0048
Iteration 60, loss = 0.0018
Iteration 80, loss = 0.0014
--- Epoch 628 / 1369 - 2261 epochs total
Iteration 0, loss = 0.0106
Iteration 20, loss = 0.0016
Iteration 40, loss = 0.0033
Iteration 60, loss = 0.0023
Iteration 80, loss = 0.0040
--- Epoch 629 / 1369 - 2262 epochs total
Iteration 0, loss = 0.0020
Iteration 20, loss = 0.0093
Iteration 40, loss = 0.0013
Iteration 60, loss = 0.0035
Iteration 80, loss = 0.0045
--- Epoch 630 / 1369 - 2263 epochs total
Iteration 0, loss = 0.0052
Iteration 20, loss = 0.0168
Iteration 40, loss = 0.0040
Iteration 60, loss = 0.0065
Iteration 80, loss = 0.0029
--- Epoch 631 / 1369 - 2264 epochs total
Iteration 0, loss = 0.0023
Iteration 20, loss = 0.0058
Iteration 40, loss = 0.0048
Iteration 60, loss = 0.0076
Iteration 80, loss = 0.0182
--- Epoch 632 / 1369 - 2265 epochs total
Iteration 0, loss = 0.0035
Iteration 20, loss = 0.0072
Iteration 40, loss = 0.0027
Iteration 60, loss = 0.0026
Iteration 80, loss = 0.0053
--- Epoch 633 / 1369 - 2266 epochs total
Iteration 0, loss = 0.0039
Iteration 20, loss = 0.0043
Iteration 40, loss = 0.0090
Iteration 60, loss = 0.0035
Iteration 80, loss = 0.0042
--- Epoch 634 / 1369 - 2267 epochs total
Iteration 0, loss = 0.0109
Iteration 20, loss = 0.0014
Iteration 40, loss = 0.0044
Iteration 60, loss = 0.0032
Iteration 80, loss = 0.0039
--- Epoch 635 / 1369 - 2268 epochs total
Iteration 0, loss = 0.0033
Iteration 20, loss = 0.0028
Iteration 40, loss = 0.0016
Iteration 60, loss = 0.0012
Iteration 80, loss = 0.0010
--- Epoch 636 / 1369 - 2269 epochs total
Iteration 0, loss = 0.0034
Iteration 20, loss = 0.0136
Iteration 40, loss = 0.0012
Iteration 60, loss = 0.0060
Iteration 80, loss = 0.0013
--- Epoch 637 / 1369 - 2270 epochs total
Iteration 0, loss = 0.0053
Iteration 20, loss = 0.0015
Iteration 40, loss = 0.0053
Iteration 60, loss = 0.0043
Iteration 80, loss = 0.0019
--- Epoch 638 / 1369 - 2271 epochs total
Iteration 0, loss = 0.0032
Iteration 20, loss = 0.0016
Iteration 40, loss = 0.0036
Iteration 60, loss = 0.0013
Iteration 80, loss = 0.0046
--- Epoch 639 / 1369 - 2272 epochs total
Iteration 0, loss = 0.0018
Iteration 20, loss = 0.0032
Iteration 40, loss = 0.0040
Iteration 60, loss = 0.0014
Iteration 80, loss = 0.0062
--- Epoch 640 / 1369 - 2273 epochs total
Iteration 0, loss = 0.0011
Iteration 20, loss = 0.0088
Iteration 40, loss = 0.0131
Iteration 60, loss = 0.0014
Iteration 80, loss = 0.0062
--- Epoch 641 / 1369 - 2274 epochs total
Iteration 0, loss = 0.0049
Iteration 20, loss = 0.0015
Iteration 40, loss = 0.0032
Iteration 60, loss = 0.0067
Iteration 80, loss = 0.0094
--- Epoch 642 / 1369 - 2275 epochs total
Iteration 0, loss = 0.0030
Iteration 20, loss = 0.0047
Iteration 40, loss = 0.0036
Iteration 60, loss = 0.0020
Iteration 80, loss = 0.0032
--- Epoch 643 / 1369 - 2276 epochs total
Iteration 0, loss = 0.0079
Iteration 20, loss = 0.0027
Iteration 40, loss = 0.0020
Iteration 60, loss = 0.0076
Iteration 80, loss = 0.0017
--- Epoch 644 / 1369 - 2277 epochs total
Iteration 0, loss = 0.0029
Iteration 20, loss = 0.0013
Iteration 40, loss = 0.0136
Iteration 60, loss = 0.0014
Iteration 80, loss = 0.0081
--- Epoch 645 / 1369 - 2278 epochs total
Iteration 0, loss = 0.0035
Iteration 20, loss = 0.0077
Iteration 40, loss = 0.0031
Iteration 60, loss = 0.0016
Iteration 80, loss = 0.0018
--- Epoch 646 / 1369 - 2279 epochs total
Iteration 0, loss = 0.0010
Iteration 20, loss = 0.0033
Iteration 40, loss = 0.0125
Iteration 60, loss = 0.0028
Iteration 80, loss = 0.0177
--- Epoch 647 / 1369 - 2280 epochs total
Iteration 0, loss = 0.0029
Iteration 20, loss = 0.0013
Iteration 40, loss = 0.0112
Iteration 60, loss = 0.0027
Iteration 80, loss = 0.0025
--- Epoch 648 / 1369 - 2281 epochs total
Iteration 0, loss = 0.0028
Iteration 20, loss = 0.0040
Iteration 40, loss = 0.0059
Iteration 60, loss = 0.0028
Iteration 80, loss = 0.0055
--- Epoch 649 / 1369 - 2282 epochs total
Iteration 0, loss = 0.0042
Iteration 20, loss = 0.0009
Iteration 40, loss = 0.0051
Iteration 60, loss = 0.0497
Iteration 80, loss = 0.0060
--- Epoch 650 / 1369 - 2283 epochs total
Iteration 0, loss = 0.0052
Iteration 20, loss = 0.0040
Iteration 40, loss = 0.0053
Iteration 60, loss = 0.0034
Iteration 80, loss = 0.0031
--- Epoch 651 / 1369 - 2284 epochs total
Iteration 0, loss = 0.0020
Iteration 20, loss = 0.0044
Iteration 40, loss = 0.0036
Iteration 60, loss = 0.0029
Iteration 80, loss = 0.0043
--- Epoch 652 / 1369 - 2285 epochs total
Iteration 0, loss = 0.0059
Iteration 20, loss = 0.0025
Iteration 40, loss = 0.0013
Iteration 60, loss = 0.0039
Iteration 80, loss = 0.0039
--- Epoch 653 / 1369 - 2286 epochs total
Iteration 0, loss = 0.0081
Iteration 20, loss = 0.0031
Iteration 40, loss = 0.0029
Iteration 60, loss = 0.0049
Iteration 80, loss = 0.0029
--- Epoch 654 / 1369 - 2287 epochs total
Iteration 0, loss = 0.0056
Iteration 20, loss = 0.0027
Iteration 40, loss = 0.0115
Iteration 60, loss = 0.0026
Iteration 80, loss = 0.0022
--- Epoch 655 / 1369 - 2288 epochs total
Iteration 0, loss = 0.0055
Iteration 20, loss = 0.0011
Iteration 40, loss = 0.0036
Iteration 60, loss = 0.0030
Iteration 80, loss = 0.0034
--- Epoch 656 / 1369 - 2289 epochs total
Iteration 0, loss = 0.0031
Iteration 20, loss = 0.0056
Iteration 40, loss = 0.0012
Iteration 60, loss = 0.0048
Iteration 80, loss = 0.0033
--- Epoch 657 / 1369 - 2290 epochs total
Iteration 0, loss = 0.0033
Iteration 20, loss = 0.0074
Iteration 40, loss = 0.0011
Iteration 60, loss = 0.0055
Iteration 80, loss = 0.0009
--- Epoch 658 / 1369 - 2291 epochs total
Iteration 0, loss = 0.0069
Iteration 20, loss = 0.0012
Iteration 40, loss = 0.0039
Iteration 60, loss = 0.0022
Iteration 80, loss = 0.0021
--- Epoch 659 / 1369 - 2292 epochs total
Iteration 0, loss = 0.0083
Iteration 20, loss = 0.0035
Iteration 40, loss = 0.0044
Iteration 60, loss = 0.0078
Iteration 80, loss = 0.0007
--- Epoch 660 / 1369 - 2293 epochs total
Iteration 0, loss = 0.0023
Iteration 20, loss = 0.0015
Iteration 40, loss = 0.0045
Iteration 60, loss = 0.0089
Iteration 80, loss = 0.0250
--- Epoch 661 / 1369 - 2294 epochs total
Iteration 0, loss = 0.0050
Iteration 20, loss = 0.0046
Iteration 40, loss = 0.0045
Iteration 60, loss = 0.0103
Iteration 80, loss = 0.0088
--- Epoch 662 / 1369 - 2295 epochs total
Iteration 0, loss = 0.0015
Iteration 20, loss = 0.0033
Iteration 40, loss = 0.0130
Iteration 60, loss = 0.0042
Iteration 80, loss = 0.0055
--- Epoch 663 / 1369 - 2296 epochs total
Iteration 0, loss = 0.0058
Iteration 20, loss = 0.0053
Iteration 40, loss = 0.0071
Iteration 60, loss = 0.0064
Iteration 80, loss = 0.0014
--- Epoch 664 / 1369 - 2297 epochs total
Iteration 0, loss = 0.0121
Iteration 20, loss = 0.0041
Iteration 40, loss = 0.0047
Iteration 60, loss = 0.0120
Iteration 80, loss = 0.0056
--- Epoch 665 / 1369 - 2298 epochs total
Iteration 0, loss = 0.0041
Iteration 20, loss = 0.0066
Iteration 40, loss = 0.0019
Iteration 60, loss = 0.0052
Iteration 80, loss = 0.0149
--- Epoch 666 / 1369 - 2299 epochs total
Iteration 0, loss = 0.0319
Iteration 20, loss = 0.0115
Iteration 40, loss = 0.0181
Iteration 60, loss = 0.0028
Iteration 80, loss = 0.0041
--- Epoch 667 / 1369 - 2300 epochs total
Iteration 0, loss = 0.0012
Iteration 20, loss = 0.0025
Iteration 40, loss = 0.0034
Iteration 60, loss = 0.0075
Iteration 80, loss = 0.0085
--- Epoch 668 / 1369 - 2301 epochs total
Iteration 0, loss = 0.0031
Iteration 20, loss = 0.0018
Iteration 40, loss = 0.0025
Iteration 60, loss = 0.0087
Iteration 80, loss = 0.0059
--- Epoch 669 / 1369 - 2302 epochs total
Iteration 0, loss = 0.0011
Iteration 20, loss = 0.0025
Iteration 40, loss = 0.0019
Iteration 60, loss = 0.0064
Iteration 80, loss = 0.0094
--- Epoch 670 / 1369 - 2303 epochs total
Iteration 0, loss = 0.0050
Iteration 20, loss = 0.0023
Iteration 40, loss = 0.0037
Iteration 60, loss = 0.0029
Iteration 80, loss = 0.0020
--- Epoch 671 / 1369 - 2304 epochs total
Iteration 0, loss = 0.0068
Iteration 20, loss = 0.0142
Iteration 40, loss = 0.0075
Iteration 60, loss = 0.0018
Iteration 80, loss = 0.0100
--- Epoch 672 / 1369 - 2305 epochs total
Iteration 0, loss = 0.0026
Iteration 20, loss = 0.0008
Iteration 40, loss = 0.0036
Iteration 60, loss = 0.0088
Iteration 80, loss = 0.0030
--- Epoch 673 / 1369 - 2306 epochs total
Iteration 0, loss = 0.0029
Iteration 20, loss = 0.0038
Iteration 40, loss = 0.0037
Iteration 60, loss = 0.0023
Iteration 80, loss = 0.0319
--- Epoch 674 / 1369 - 2307 epochs total
Iteration 0, loss = 0.0011
Iteration 20, loss = 0.0066
Iteration 40, loss = 0.0099
Iteration 60, loss = 0.0210
Iteration 80, loss = 0.0010
--- Epoch 675 / 1369 - 2308 epochs total
Iteration 0, loss = 0.0046
Iteration 20, loss = 0.0043
Iteration 40, loss = 0.0111
Iteration 60, loss = 0.0042
Iteration 80, loss = 0.0058
--- Epoch 676 / 1369 - 2309 epochs total
Iteration 0, loss = 0.0054
Iteration 20, loss = 0.0022
Iteration 40, loss = 0.0019
Iteration 60, loss = 0.0280
Iteration 80, loss = 0.0085
--- Epoch 677 / 1369 - 2310 epochs total
Iteration 0, loss = 0.0170
Iteration 20, loss = 0.0015
Iteration 40, loss = 0.0045
Iteration 60, loss = 0.0118
Iteration 80, loss = 0.0104
--- Epoch 678 / 1369 - 2311 epochs total
Iteration 0, loss = 0.0050
Iteration 20, loss = 0.0019
Iteration 40, loss = 0.0092
Iteration 60, loss = 0.0029
Iteration 80, loss = 0.0035
--- Epoch 679 / 1369 - 2312 epochs total
Iteration 0, loss = 0.0025
Iteration 20, loss = 0.0077
Iteration 40, loss = 0.0058
Iteration 60, loss = 0.0026
Iteration 80, loss = 0.0027
--- Epoch 680 / 1369 - 2313 epochs total
Iteration 0, loss = 0.0022
Iteration 20, loss = 0.0121
Iteration 40, loss = 0.0030
Iteration 60, loss = 0.0056
Iteration 80, loss = 0.0023
--- Epoch 681 / 1369 - 2314 epochs total
Iteration 0, loss = 0.0081
Iteration 20, loss = 0.0048
Iteration 40, loss = 0.0062
Iteration 60, loss = 0.0033
Iteration 80, loss = 0.0021
--- Epoch 682 / 1369 - 2315 epochs total
Iteration 0, loss = 0.0080
Iteration 20, loss = 0.0114
Iteration 40, loss = 0.0030
Iteration 60, loss = 0.0013
Iteration 80, loss = 0.0034
--- Epoch 683 / 1369 - 2316 epochs total
Iteration 0, loss = 0.0009
Iteration 20, loss = 0.0083
Iteration 40, loss = 0.0020
Iteration 60, loss = 0.0027
Iteration 80, loss = 0.0039
--- Epoch 684 / 1369 - 2317 epochs total
Iteration 0, loss = 0.0028
Iteration 20, loss = 0.0014
Iteration 40, loss = 0.0085
Iteration 60, loss = 0.0018
Iteration 80, loss = 0.0016
--- Epoch 685 / 1369 - 2318 epochs total
Iteration 0, loss = 0.0310
Iteration 20, loss = 0.0062
Iteration 40, loss = 0.0076
Iteration 60, loss = 0.0054
Iteration 80, loss = 0.0030
--- Epoch 686 / 1369 - 2319 epochs total
Iteration 0, loss = 0.0148
Iteration 20, loss = 0.0055
Iteration 40, loss = 0.0076
Iteration 60, loss = 0.0028
Iteration 80, loss = 0.0060
--- Epoch 687 / 1369 - 2320 epochs total
Iteration 0, loss = 0.0080
Iteration 20, loss = 0.0088
Iteration 40, loss = 0.0032
Iteration 60, loss = 0.0107
Iteration 80, loss = 0.0124
--- Epoch 688 / 1369 - 2321 epochs total
Iteration 0, loss = 0.0242
Iteration 20, loss = 0.0034
Iteration 40, loss = 0.0034
Iteration 60, loss = 0.0091
Iteration 80, loss = 0.0016
--- Epoch 689 / 1369 - 2322 epochs total
Iteration 0, loss = 0.0067
Iteration 20, loss = 0.0014
Iteration 40, loss = 0.0030
Iteration 60, loss = 0.0049
Iteration 80, loss = 0.0054
--- Epoch 690 / 1369 - 2323 epochs total
Iteration 0, loss = 0.0026
Iteration 20, loss = 0.0284
Iteration 40, loss = 0.0034
Iteration 60, loss = 0.0089
Iteration 80, loss = 0.0187
--- Epoch 691 / 1369 - 2324 epochs total
Iteration 0, loss = 0.0059
Iteration 20, loss = 0.0026
Iteration 40, loss = 0.0022
Iteration 60, loss = 0.0062
Iteration 80, loss = 0.0115
--- Epoch 692 / 1369 - 2325 epochs total
Iteration 0, loss = 0.0095
Iteration 20, loss = 0.0089
Iteration 40, loss = 0.0013
Iteration 60, loss = 0.0055
Iteration 80, loss = 0.0014
--- Epoch 693 / 1369 - 2326 epochs total
Iteration 0, loss = 0.0135
Iteration 20, loss = 0.0038
Iteration 40, loss = 0.0073
Iteration 60, loss = 0.0109
Iteration 80, loss = 0.0015
--- Epoch 694 / 1369 - 2327 epochs total
Iteration 0, loss = 0.0059
Iteration 20, loss = 0.0027
Iteration 40, loss = 0.0143
Iteration 60, loss = 0.0017
Iteration 80, loss = 0.0088
--- Epoch 695 / 1369 - 2328 epochs total
Iteration 0, loss = 0.0021
Iteration 20, loss = 0.0017
Iteration 40, loss = 0.0034
Iteration 60, loss = 0.0024
Iteration 80, loss = 0.0139
--- Epoch 696 / 1369 - 2329 epochs total
Iteration 0, loss = 0.0033
Iteration 20, loss = 0.0013
Iteration 40, loss = 0.0126
Iteration 60, loss = 0.0038
Iteration 80, loss = 0.0088
--- Epoch 697 / 1369 - 2330 epochs total
Iteration 0, loss = 0.0036
Iteration 20, loss = 0.0026
Iteration 40, loss = 0.0028
Iteration 60, loss = 0.0072
Iteration 80, loss = 0.0016
--- Epoch 698 / 1369 - 2331 epochs total
Iteration 0, loss = 0.0029
Iteration 20, loss = 0.0120
Iteration 40, loss = 0.0037
Iteration 60, loss = 0.0017
Iteration 80, loss = 0.0378
--- Epoch 699 / 1369 - 2332 epochs total
Iteration 0, loss = 0.0237
Iteration 20, loss = 0.0017
Iteration 40, loss = 0.0037
Iteration 60, loss = 0.0032
Iteration 80, loss = 0.0019
--- Epoch 700 / 1369 - 2333 epochs total
Iteration 0, loss = 0.0044
Iteration 20, loss = 0.0107
Iteration 40, loss = 0.0028
Iteration 60, loss = 0.0021
Iteration 80, loss = 0.0026
--- Epoch 701 / 1369 - 2334 epochs total
Iteration 0, loss = 0.0033
Iteration 20, loss = 0.0077
Iteration 40, loss = 0.0041
Iteration 60, loss = 0.0126
Iteration 80, loss = 0.0022
--- Epoch 702 / 1369 - 2335 epochs total
Iteration 0, loss = 0.0049
Iteration 20, loss = 0.0098
Iteration 40, loss = 0.0012
Iteration 60, loss = 0.0025
Iteration 80, loss = 0.0018
--- Epoch 703 / 1369 - 2336 epochs total
Iteration 0, loss = 0.0023
Iteration 20, loss = 0.0017
Iteration 40, loss = 0.0125
Iteration 60, loss = 0.0044
Iteration 80, loss = 0.0025
--- Epoch 704 / 1369 - 2337 epochs total
Iteration 0, loss = 0.0015
Iteration 20, loss = 0.0038
Iteration 40, loss = 0.0021
Iteration 60, loss = 0.0083
Iteration 80, loss = 0.0020
--- Epoch 705 / 1369 - 2338 epochs total
Iteration 0, loss = 0.0082
Iteration 20, loss = 0.0072
Iteration 40, loss = 0.0008
Iteration 60, loss = 0.0046
Iteration 80, loss = 0.0060
--- Epoch 706 / 1369 - 2339 epochs total
Iteration 0, loss = 0.0015
Iteration 20, loss = 0.0030
Iteration 40, loss = 0.0021
Iteration 60, loss = 0.0016
Iteration 80, loss = 0.0019
--- Epoch 707 / 1369 - 2340 epochs total
Iteration 0, loss = 0.0015
Iteration 20, loss = 0.0061
Iteration 40, loss = 0.0010
Iteration 60, loss = 0.0025
Iteration 80, loss = 0.0016
--- Epoch 708 / 1369 - 2341 epochs total
Iteration 0, loss = 0.0056
Iteration 20, loss = 0.0043
Iteration 40, loss = 0.0202
Iteration 60, loss = 0.0009
Iteration 80, loss = 0.0029
--- Epoch 709 / 1369 - 2342 epochs total
Iteration 0, loss = 0.0021
Iteration 20, loss = 0.0024
Iteration 40, loss = 0.0126
Iteration 60, loss = 0.0065
Iteration 80, loss = 0.0019
--- Epoch 710 / 1369 - 2343 epochs total
Iteration 0, loss = 0.0028
Iteration 20, loss = 0.0109
Iteration 40, loss = 0.0044
Iteration 60, loss = 0.0027
Iteration 80, loss = 0.0062
--- Epoch 711 / 1369 - 2344 epochs total
Iteration 0, loss = 0.0075
Iteration 20, loss = 0.0026
Iteration 40, loss = 0.0060
Iteration 60, loss = 0.0028
Iteration 80, loss = 0.0057
--- Epoch 712 / 1369 - 2345 epochs total
Iteration 0, loss = 0.0046
Iteration 20, loss = 0.0385
Iteration 40, loss = 0.0044
Iteration 60, loss = 0.0021
Iteration 80, loss = 0.0037
--- Epoch 713 / 1369 - 2346 epochs total
Iteration 0, loss = 0.0129
Iteration 20, loss = 0.0051
Iteration 40, loss = 0.0039
Iteration 60, loss = 0.0110
Iteration 80, loss = 0.0069
--- Epoch 714 / 1369 - 2347 epochs total
Iteration 0, loss = 0.0017
Iteration 20, loss = 0.0011
Iteration 40, loss = 0.0019
Iteration 60, loss = 0.0058
Iteration 80, loss = 0.0014
--- Epoch 715 / 1369 - 2348 epochs total
Iteration 0, loss = 0.0045
Iteration 20, loss = 0.0049
Iteration 40, loss = 0.0048
Iteration 60, loss = 0.0071
Iteration 80, loss = 0.0021
--- Epoch 716 / 1369 - 2349 epochs total
Iteration 0, loss = 0.0020
Iteration 20, loss = 0.0048
Iteration 40, loss = 0.0039
Iteration 60, loss = 0.0048
Iteration 80, loss = 0.0013
--- Epoch 717 / 1369 - 2350 epochs total
Iteration 0, loss = 0.0031
Iteration 20, loss = 0.0009
Iteration 40, loss = 0.0068
Iteration 60, loss = 0.0127
Iteration 80, loss = 0.0087
--- Epoch 718 / 1369 - 2351 epochs total
Iteration 0, loss = 0.0092
Iteration 20, loss = 0.0025
Iteration 40, loss = 0.0036
Iteration 60, loss = 0.0005
Iteration 80, loss = 0.0035
--- Epoch 719 / 1369 - 2352 epochs total
Iteration 0, loss = 0.0042
Iteration 20, loss = 0.0033
Iteration 40, loss = 0.0035
Iteration 60, loss = 0.0021
Iteration 80, loss = 0.0016
--- Epoch 720 / 1369 - 2353 epochs total
Iteration 0, loss = 0.0028
Iteration 20, loss = 0.0022
Iteration 40, loss = 0.0019
Iteration 60, loss = 0.0080
Iteration 80, loss = 0.0015
--- Epoch 721 / 1369 - 2354 epochs total
Iteration 0, loss = 0.0011
Iteration 20, loss = 0.0210
Iteration 40, loss = 0.0027
Iteration 60, loss = 0.0038
Iteration 80, loss = 0.0038
--- Epoch 722 / 1369 - 2355 epochs total
Iteration 0, loss = 0.0033
Iteration 20, loss = 0.0028
Iteration 40, loss = 0.0005
Iteration 60, loss = 0.0025
Iteration 80, loss = 0.0032
--- Epoch 723 / 1369 - 2356 epochs total
Iteration 0, loss = 0.0039
Iteration 20, loss = 0.0048
Iteration 40, loss = 0.0031
Iteration 60, loss = 0.0014
Iteration 80, loss = 0.0073
--- Epoch 724 / 1369 - 2357 epochs total
Iteration 0, loss = 0.0169
Iteration 20, loss = 0.0040
Iteration 40, loss = 0.0057
Iteration 60, loss = 0.0038
Iteration 80, loss = 0.0008
--- Epoch 725 / 1369 - 2358 epochs total
Iteration 0, loss = 0.0019
Iteration 20, loss = 0.0039
Iteration 40, loss = 0.0158
Iteration 60, loss = 0.0025
Iteration 80, loss = 0.0045
--- Epoch 726 / 1369 - 2359 epochs total
Iteration 0, loss = 0.0161
Iteration 20, loss = 0.0047
Iteration 40, loss = 0.0063
Iteration 60, loss = 0.0051
Iteration 80, loss = 0.0104
--- Epoch 727 / 1369 - 2360 epochs total
Iteration 0, loss = 0.0021
Iteration 20, loss = 0.0021
Iteration 40, loss = 0.0021
Iteration 60, loss = 0.0158
Iteration 80, loss = 0.0058
--- Epoch 728 / 1369 - 2361 epochs total
Iteration 0, loss = 0.0059
Iteration 20, loss = 0.0050
Iteration 40, loss = 0.0037
Iteration 60, loss = 0.0012
Iteration 80, loss = 0.0027
--- Epoch 729 / 1369 - 2362 epochs total
Iteration 0, loss = 0.0020
Iteration 20, loss = 0.0058
Iteration 40, loss = 0.0017
Iteration 60, loss = 0.0051
Iteration 80, loss = 0.0127
--- Epoch 730 / 1369 - 2363 epochs total
Iteration 0, loss = 0.0013
Iteration 20, loss = 0.0034
Iteration 40, loss = 0.0062
Iteration 60, loss = 0.0016
Iteration 80, loss = 0.0035
--- Epoch 731 / 1369 - 2364 epochs total
Iteration 0, loss = 0.0019
Iteration 20, loss = 0.0157
Iteration 40, loss = 0.0021
Iteration 60, loss = 0.0018
Iteration 80, loss = 0.0106
--- Epoch 732 / 1369 - 2365 epochs total
Iteration 0, loss = 0.0064
Iteration 20, loss = 0.0072
Iteration 40, loss = 0.0080
Iteration 60, loss = 0.0014
Iteration 80, loss = 0.0022
--- Epoch 733 / 1369 - 2366 epochs total
Iteration 0, loss = 0.0118
Iteration 20, loss = 0.0041
Iteration 40, loss = 0.0118
Iteration 60, loss = 0.0096
Iteration 80, loss = 0.0137
--- Epoch 734 / 1369 - 2367 epochs total
Iteration 0, loss = 0.0065
Iteration 20, loss = 0.0034
Iteration 40, loss = 0.0031
Iteration 60, loss = 0.0059
Iteration 80, loss = 0.0045
--- Epoch 735 / 1369 - 2368 epochs total
Iteration 0, loss = 0.0043
Iteration 20, loss = 0.0020
Iteration 40, loss = 0.0051
Iteration 60, loss = 0.0077
Iteration 80, loss = 0.0023
--- Epoch 736 / 1369 - 2369 epochs total
Iteration 0, loss = 0.0020
Iteration 20, loss = 0.0016
Iteration 40, loss = 0.0074
Iteration 60, loss = 0.0017
Iteration 80, loss = 0.0020
--- Epoch 737 / 1369 - 2370 epochs total
Iteration 0, loss = 0.0098
Iteration 20, loss = 0.0039
Iteration 40, loss = 0.0080
Iteration 60, loss = 0.0025
Iteration 80, loss = 0.0020
--- Epoch 738 / 1369 - 2371 epochs total
Iteration 0, loss = 0.0036
Iteration 20, loss = 0.0158
Iteration 40, loss = 0.0006
Iteration 60, loss = 0.0014
Iteration 80, loss = 0.0080
--- Epoch 739 / 1369 - 2372 epochs total
Iteration 0, loss = 0.0056
Iteration 20, loss = 0.0040
Iteration 40, loss = 0.0040
Iteration 60, loss = 0.0018
Iteration 80, loss = 0.0058
--- Epoch 740 / 1369 - 2373 epochs total
Iteration 0, loss = 0.0068
Iteration 20, loss = 0.0083
Iteration 40, loss = 0.0095
Iteration 60, loss = 0.0043
Iteration 80, loss = 0.0027
--- Epoch 741 / 1369 - 2374 epochs total
Iteration 0, loss = 0.0074
Iteration 20, loss = 0.0036
Iteration 40, loss = 0.0206
Iteration 60, loss = 0.0031
Iteration 80, loss = 0.0091
--- Epoch 742 / 1369 - 2375 epochs total
Iteration 0, loss = 0.0019
Iteration 20, loss = 0.0010
Iteration 40, loss = 0.0059
Iteration 60, loss = 0.0039
Iteration 80, loss = 0.0023
--- Epoch 743 / 1369 - 2376 epochs total
Iteration 0, loss = 0.0058
Iteration 20, loss = 0.0012
Iteration 40, loss = 0.0011
Iteration 60, loss = 0.0085
Iteration 80, loss = 0.0020
--- Epoch 744 / 1369 - 2377 epochs total
Iteration 0, loss = 0.0042
Iteration 20, loss = 0.0094
Iteration 40, loss = 0.0019
Iteration 60, loss = 0.0158
Iteration 80, loss = 0.0269
--- Epoch 745 / 1369 - 2378 epochs total
Iteration 0, loss = 0.0064
Iteration 20, loss = 0.0027
Iteration 40, loss = 0.0017
Iteration 60, loss = 0.0041
Iteration 80, loss = 0.0042
--- Epoch 746 / 1369 - 2379 epochs total
Iteration 0, loss = 0.0059
Iteration 20, loss = 0.0068
Iteration 40, loss = 0.0027
Iteration 60, loss = 0.0024
Iteration 80, loss = 0.0153
--- Epoch 747 / 1369 - 2380 epochs total
Iteration 0, loss = 0.0167
Iteration 20, loss = 0.0044
Iteration 40, loss = 0.0028
Iteration 60, loss = 0.0016
Iteration 80, loss = 0.0107
--- Epoch 748 / 1369 - 2381 epochs total
Iteration 0, loss = 0.0014
Iteration 20, loss = 0.0034
Iteration 40, loss = 0.0047
Iteration 60, loss = 0.0008
Iteration 80, loss = 0.0123
--- Epoch 749 / 1369 - 2382 epochs total
Iteration 0, loss = 0.0026
Iteration 20, loss = 0.0098
Iteration 40, loss = 0.0050
Iteration 60, loss = 0.0379
Iteration 80, loss = 0.0011
--- Epoch 750 / 1369 - 2383 epochs total
Iteration 0, loss = 0.0109
Iteration 20, loss = 0.0043
Iteration 40, loss = 0.0014
Iteration 60, loss = 0.0020
Iteration 80, loss = 0.0007
--- Epoch 751 / 1369 - 2384 epochs total
Iteration 0, loss = 0.0052
Iteration 20, loss = 0.0052
Iteration 40, loss = 0.0019
Iteration 60, loss = 0.0104
Iteration 80, loss = 0.0027
--- Epoch 752 / 1369 - 2385 epochs total
Iteration 0, loss = 0.0020
Iteration 20, loss = 0.0036
Iteration 40, loss = 0.0051
Iteration 60, loss = 0.0016
Iteration 80, loss = 0.0071
--- Epoch 753 / 1369 - 2386 epochs total
Iteration 0, loss = 0.0022
Iteration 20, loss = 0.0038
Iteration 40, loss = 0.0031
Iteration 60, loss = 0.0019
Iteration 80, loss = 0.0045
--- Epoch 754 / 1369 - 2387 epochs total
Iteration 0, loss = 0.0020
Iteration 20, loss = 0.0158
Iteration 40, loss = 0.0051
Iteration 60, loss = 0.0019
Iteration 80, loss = 0.0059
--- Epoch 755 / 1369 - 2388 epochs total
Iteration 0, loss = 0.0029
Iteration 20, loss = 0.0026
Iteration 40, loss = 0.0021
Iteration 60, loss = 0.0031
Iteration 80, loss = 0.0034
--- Epoch 756 / 1369 - 2389 epochs total
Iteration 0, loss = 0.0018
Iteration 20, loss = 0.0046
Iteration 40, loss = 0.0075
Iteration 60, loss = 0.0015
Iteration 80, loss = 0.0199
--- Epoch 757 / 1369 - 2390 epochs total
Iteration 0, loss = 0.0024
Iteration 20, loss = 0.0020
Iteration 40, loss = 0.0160
Iteration 60, loss = 0.0120
Iteration 80, loss = 0.0072
--- Epoch 758 / 1369 - 2391 epochs total
Iteration 0, loss = 0.0085
Iteration 20, loss = 0.0069
Iteration 40, loss = 0.0011
Iteration 60, loss = 0.0034
Iteration 80, loss = 0.0012
--- Epoch 759 / 1369 - 2392 epochs total
Iteration 0, loss = 0.0030
Iteration 20, loss = 0.0057
Iteration 40, loss = 0.0016
Iteration 60, loss = 0.0007
Iteration 80, loss = 0.0025
--- Epoch 760 / 1369 - 2393 epochs total
Iteration 0, loss = 0.0053
Iteration 20, loss = 0.0036
Iteration 40, loss = 0.0021
Iteration 60, loss = 0.0021
Iteration 80, loss = 0.0069
--- Epoch 761 / 1369 - 2394 epochs total
Iteration 0, loss = 0.0075
Iteration 20, loss = 0.0072
Iteration 40, loss = 0.0005
Iteration 60, loss = 0.0018
Iteration 80, loss = 0.0038
--- Epoch 762 / 1369 - 2395 epochs total
Iteration 0, loss = 0.0034
Iteration 20, loss = 0.0023
Iteration 40, loss = 0.0023
Iteration 60, loss = 0.0018
Iteration 80, loss = 0.0011
--- Epoch 763 / 1369 - 2396 epochs total
Iteration 0, loss = 0.0022
Iteration 20, loss = 0.0018
Iteration 40, loss = 0.0006
Iteration 60, loss = 0.0022
Iteration 80, loss = 0.0019
--- Epoch 764 / 1369 - 2397 epochs total
Iteration 0, loss = 0.0054
Iteration 20, loss = 0.0045
Iteration 40, loss = 0.0026
Iteration 60, loss = 0.0068
Iteration 80, loss = 0.0112
--- Epoch 765 / 1369 - 2398 epochs total
Iteration 0, loss = 0.0013
Iteration 20, loss = 0.0020
Iteration 40, loss = 0.0104
Iteration 60, loss = 0.0282
Iteration 80, loss = 0.0012
--- Epoch 766 / 1369 - 2399 epochs total
Iteration 0, loss = 0.0018
Iteration 20, loss = 0.0181
Iteration 40, loss = 0.0085
Iteration 60, loss = 0.0012
Iteration 80, loss = 0.0092
--- Epoch 767 / 1369 - 2400 epochs total
Iteration 0, loss = 0.0028
Iteration 20, loss = 0.0052
Iteration 40, loss = 0.0006
Iteration 60, loss = 0.0048
Iteration 80, loss = 0.0021
--- Epoch 768 / 1369 - 2401 epochs total
Iteration 0, loss = 0.0030
Iteration 20, loss = 0.0030
Iteration 40, loss = 0.0091
Iteration 60, loss = 0.0194
Iteration 80, loss = 0.0025
--- Epoch 769 / 1369 - 2402 epochs total
Iteration 0, loss = 0.0042
Iteration 20, loss = 0.0020
Iteration 40, loss = 0.0129
Iteration 60, loss = 0.0019
Iteration 80, loss = 0.0052
--- Epoch 770 / 1369 - 2403 epochs total
Iteration 0, loss = 0.0025
Iteration 20, loss = 0.0022
Iteration 40, loss = 0.0039
Iteration 60, loss = 0.0034
Iteration 80, loss = 0.0024
--- Epoch 771 / 1369 - 2404 epochs total
Iteration 0, loss = 0.0051
Iteration 20, loss = 0.0014
Iteration 40, loss = 0.0041
Iteration 60, loss = 0.0053
Iteration 80, loss = 0.0014
--- Epoch 772 / 1369 - 2405 epochs total
Iteration 0, loss = 0.0044
Iteration 20, loss = 0.0029
Iteration 40, loss = 0.0019
Iteration 60, loss = 0.0086
Iteration 80, loss = 0.0025
--- Epoch 773 / 1369 - 2406 epochs total
Iteration 0, loss = 0.0052
Iteration 20, loss = 0.0034
Iteration 40, loss = 0.0037
Iteration 60, loss = 0.0085
Iteration 80, loss = 0.0120
--- Epoch 774 / 1369 - 2407 epochs total
Iteration 0, loss = 0.0043
Iteration 20, loss = 0.0029
Iteration 40, loss = 0.0067
Iteration 60, loss = 0.0025
Iteration 80, loss = 0.0045
--- Epoch 775 / 1369 - 2408 epochs total
Iteration 0, loss = 0.0032
Iteration 20, loss = 0.0088
Iteration 40, loss = 0.0235
Iteration 60, loss = 0.0109
Iteration 80, loss = 0.0055
--- Epoch 776 / 1369 - 2409 epochs total
Iteration 0, loss = 0.0015
Iteration 20, loss = 0.0032
Iteration 40, loss = 0.0035
Iteration 60, loss = 0.0172
Iteration 80, loss = 0.0058
--- Epoch 777 / 1369 - 2410 epochs total
Iteration 0, loss = 0.0037
Iteration 20, loss = 0.0040
Iteration 40, loss = 0.0053
Iteration 60, loss = 0.0034
Iteration 80, loss = 0.0026
--- Epoch 778 / 1369 - 2411 epochs total
Iteration 0, loss = 0.0078
Iteration 20, loss = 0.0018
Iteration 40, loss = 0.0030
Iteration 60, loss = 0.0064
Iteration 80, loss = 0.0085
--- Epoch 779 / 1369 - 2412 epochs total
Iteration 0, loss = 0.0044
Iteration 20, loss = 0.0210
Iteration 40, loss = 0.0011
Iteration 60, loss = 0.0068
Iteration 80, loss = 0.0031
--- Epoch 780 / 1369 - 2413 epochs total
Iteration 0, loss = 0.0019
Iteration 20, loss = 0.0011
Iteration 40, loss = 0.0108
Iteration 60, loss = 0.0031
Iteration 80, loss = 0.0024
--- Epoch 781 / 1369 - 2414 epochs total
Iteration 0, loss = 0.0058
Iteration 20, loss = 0.0127
Iteration 40, loss = 0.0036
Iteration 60, loss = 0.0041
Iteration 80, loss = 0.0027
--- Epoch 782 / 1369 - 2415 epochs total
Iteration 0, loss = 0.0149
Iteration 20, loss = 0.0024
Iteration 40, loss = 0.0027
Iteration 60, loss = 0.0086
Iteration 80, loss = 0.0024
--- Epoch 783 / 1369 - 2416 epochs total
Iteration 0, loss = 0.0059
Iteration 20, loss = 0.0036
Iteration 40, loss = 0.0043
Iteration 60, loss = 0.0157
Iteration 80, loss = 0.0033
--- Epoch 784 / 1369 - 2417 epochs total
Iteration 0, loss = 0.0069
Iteration 20, loss = 0.0028
Iteration 40, loss = 0.0029
Iteration 60, loss = 0.0055
Iteration 80, loss = 0.0010
--- Epoch 785 / 1369 - 2418 epochs total
Iteration 0, loss = 0.0037
Iteration 20, loss = 0.0037
Iteration 40, loss = 0.0047
Iteration 60, loss = 0.0051
Iteration 80, loss = 0.0036
--- Epoch 786 / 1369 - 2419 epochs total
Iteration 0, loss = 0.0026
Iteration 20, loss = 0.0051
Iteration 40, loss = 0.0057
Iteration 60, loss = 0.0027
Iteration 80, loss = 0.0045
--- Epoch 787 / 1369 - 2420 epochs total
Iteration 0, loss = 0.0103
Iteration 20, loss = 0.0010
Iteration 40, loss = 0.0077
Iteration 60, loss = 0.0036
Iteration 80, loss = 0.0026
--- Epoch 788 / 1369 - 2421 epochs total
Iteration 0, loss = 0.0051
Iteration 20, loss = 0.0056
Iteration 40, loss = 0.0061
Iteration 60, loss = 0.0077
Iteration 80, loss = 0.0011
--- Epoch 789 / 1369 - 2422 epochs total
Iteration 0, loss = 0.0200
Iteration 20, loss = 0.0055
Iteration 40, loss = 0.0098
Iteration 60, loss = 0.0128
Iteration 80, loss = 0.0039
--- Epoch 790 / 1369 - 2423 epochs total
Iteration 0, loss = 0.0073
Iteration 20, loss = 0.0125
Iteration 40, loss = 0.0031
Iteration 60, loss = 0.0028
Iteration 80, loss = 0.0040
--- Epoch 791 / 1369 - 2424 epochs total
Iteration 0, loss = 0.0158
Iteration 20, loss = 0.0032
Iteration 40, loss = 0.0210
Iteration 60, loss = 0.0057
Iteration 80, loss = 0.0027
--- Epoch 792 / 1369 - 2425 epochs total
Iteration 0, loss = 0.0035
Iteration 20, loss = 0.0053
Iteration 40, loss = 0.0084
Iteration 60, loss = 0.0127
Iteration 80, loss = 0.0052
--- Epoch 793 / 1369 - 2426 epochs total
Iteration 0, loss = 0.0022
Iteration 20, loss = 0.0046
Iteration 40, loss = 0.0096
Iteration 60, loss = 0.0067
Iteration 80, loss = 0.0080
--- Epoch 794 / 1369 - 2427 epochs total
Iteration 0, loss = 0.0089
Iteration 20, loss = 0.0165
Iteration 40, loss = 0.0021
Iteration 60, loss = 0.0024
Iteration 80, loss = 0.0080
--- Epoch 795 / 1369 - 2428 epochs total
Iteration 0, loss = 0.0114
Iteration 20, loss = 0.0022
Iteration 40, loss = 0.0024
Iteration 60, loss = 0.0028
Iteration 80, loss = 0.0038
--- Epoch 796 / 1369 - 2429 epochs total
Iteration 0, loss = 0.0047
Iteration 20, loss = 0.0042
Iteration 40, loss = 0.0027
Iteration 60, loss = 0.0014
Iteration 80, loss = 0.0023
--- Epoch 797 / 1369 - 2430 epochs total
Iteration 0, loss = 0.0032
Iteration 20, loss = 0.0052
Iteration 40, loss = 0.0020
Iteration 60, loss = 0.0032
Iteration 80, loss = 0.0022
--- Epoch 798 / 1369 - 2431 epochs total
Iteration 0, loss = 0.0010
Iteration 20, loss = 0.0035
Iteration 40, loss = 0.0045
Iteration 60, loss = 0.0023
Iteration 80, loss = 0.0054
--- Epoch 799 / 1369 - 2432 epochs total
Iteration 0, loss = 0.0017
Iteration 20, loss = 0.0034
Iteration 40, loss = 0.0026
Iteration 60, loss = 0.0058
Iteration 80, loss = 0.0035
--- Epoch 800 / 1369 - 2433 epochs total
Iteration 0, loss = 0.0024
Iteration 20, loss = 0.0039
Iteration 40, loss = 0.0057
Iteration 60, loss = 0.0057
Iteration 80, loss = 0.0013
--- Epoch 801 / 1369 - 2434 epochs total
Iteration 0, loss = 0.0038
Iteration 20, loss = 0.0035
Iteration 40, loss = 0.0022
Iteration 60, loss = 0.0033
Iteration 80, loss = 0.0008
--- Epoch 802 / 1369 - 2435 epochs total
Iteration 0, loss = 0.0011
Iteration 20, loss = 0.0025
Iteration 40, loss = 0.0086
Iteration 60, loss = 0.0022
Iteration 80, loss = 0.0013
--- Epoch 803 / 1369 - 2436 epochs total
Iteration 0, loss = 0.0029
Iteration 20, loss = 0.0042
Iteration 40, loss = 0.0031
Iteration 60, loss = 0.0030
Iteration 80, loss = 0.0023
--- Epoch 804 / 1369 - 2437 epochs total
Iteration 0, loss = 0.0043
Iteration 20, loss = 0.0071
Iteration 40, loss = 0.0130
Iteration 60, loss = 0.0079
Iteration 80, loss = 0.0136
--- Epoch 805 / 1369 - 2438 epochs total
Iteration 0, loss = 0.0065
Iteration 20, loss = 0.0021
Iteration 40, loss = 0.0024
Iteration 60, loss = 0.0062
Iteration 80, loss = 0.0060
--- Epoch 806 / 1369 - 2439 epochs total
Iteration 0, loss = 0.0051
Iteration 20, loss = 0.0008
Iteration 40, loss = 0.0111
Iteration 60, loss = 0.0081
Iteration 80, loss = 0.0050
--- Epoch 807 / 1369 - 2440 epochs total
Iteration 0, loss = 0.0021
Iteration 20, loss = 0.0016
Iteration 40, loss = 0.0063
Iteration 60, loss = 0.0017
Iteration 80, loss = 0.0024
--- Epoch 808 / 1369 - 2441 epochs total
Iteration 0, loss = 0.0026
Iteration 20, loss = 0.0030
Iteration 40, loss = 0.0054
Iteration 60, loss = 0.0043
Iteration 80, loss = 0.0050
--- Epoch 809 / 1369 - 2442 epochs total
Iteration 0, loss = 0.0013
Iteration 20, loss = 0.0009
Iteration 40, loss = 0.0143
Iteration 60, loss = 0.0025
Iteration 80, loss = 0.0044
--- Epoch 810 / 1369 - 2443 epochs total
Iteration 0, loss = 0.0088
Iteration 20, loss = 0.0279
Iteration 40, loss = 0.0253
Iteration 60, loss = 0.0065
Iteration 80, loss = 0.0037
--- Epoch 811 / 1369 - 2444 epochs total
Iteration 0, loss = 0.0027
Iteration 20, loss = 0.0047
Iteration 40, loss = 0.0018
Iteration 60, loss = 0.0139
Iteration 80, loss = 0.0107
--- Epoch 812 / 1369 - 2445 epochs total
Iteration 0, loss = 0.0089
Iteration 20, loss = 0.0034
Iteration 40, loss = 0.0012
Iteration 60, loss = 0.0066
Iteration 80, loss = 0.0279
--- Epoch 813 / 1369 - 2446 epochs total
Iteration 0, loss = 0.0014
Iteration 20, loss = 0.0066
Iteration 40, loss = 0.0029
Iteration 60, loss = 0.0060
Iteration 80, loss = 0.0158
--- Epoch 814 / 1369 - 2447 epochs total
Iteration 0, loss = 0.0025
Iteration 20, loss = 0.0047
Iteration 40, loss = 0.0007
Iteration 60, loss = 0.0048
Iteration 80, loss = 0.0016
--- Epoch 815 / 1369 - 2448 epochs total
Iteration 0, loss = 0.0026
Iteration 20, loss = 0.0014
Iteration 40, loss = 0.0026
Iteration 60, loss = 0.0034
Iteration 80, loss = 0.0020
--- Epoch 816 / 1369 - 2449 epochs total
Iteration 0, loss = 0.0023
Iteration 20, loss = 0.0032
Iteration 40, loss = 0.0031
Iteration 60, loss = 0.0022
Iteration 80, loss = 0.0098
--- Epoch 817 / 1369 - 2450 epochs total
Iteration 0, loss = 0.0013
Iteration 20, loss = 0.0021
Iteration 40, loss = 0.0037
Iteration 60, loss = 0.0077
Iteration 80, loss = 0.0022
--- Epoch 818 / 1369 - 2451 epochs total
Iteration 0, loss = 0.0064
Iteration 20, loss = 0.0102
Iteration 40, loss = 0.0053
Iteration 60, loss = 0.0007
Iteration 80, loss = 0.0029
--- Epoch 819 / 1369 - 2452 epochs total
Iteration 0, loss = 0.0048
Iteration 20, loss = 0.0012
Iteration 40, loss = 0.0029
Iteration 60, loss = 0.0030
Iteration 80, loss = 0.0050
--- Epoch 820 / 1369 - 2453 epochs total
Iteration 0, loss = 0.0036
Iteration 20, loss = 0.0043
Iteration 40, loss = 0.0095
Iteration 60, loss = 0.0029
Iteration 80, loss = 0.0017
--- Epoch 821 / 1369 - 2454 epochs total
Iteration 0, loss = 0.0038
Iteration 20, loss = 0.0021
Iteration 40, loss = 0.0006
Iteration 60, loss = 0.0033
Iteration 80, loss = 0.0063
--- Epoch 822 / 1369 - 2455 epochs total
Iteration 0, loss = 0.0205
Iteration 20, loss = 0.0078
Iteration 40, loss = 0.0100
Iteration 60, loss = 0.0051
Iteration 80, loss = 0.0021
--- Epoch 823 / 1369 - 2456 epochs total
Iteration 0, loss = 0.0054
Iteration 20, loss = 0.0012
Iteration 40, loss = 0.0050
Iteration 60, loss = 0.0110
Iteration 80, loss = 0.0181
--- Epoch 824 / 1369 - 2457 epochs total
Iteration 0, loss = 0.0011
Iteration 20, loss = 0.0018
Iteration 40, loss = 0.0042
Iteration 60, loss = 0.0037
Iteration 80, loss = 0.0067
--- Epoch 825 / 1369 - 2458 epochs total
Iteration 0, loss = 0.0045
Iteration 20, loss = 0.0173
Iteration 40, loss = 0.0016
Iteration 60, loss = 0.0020
Iteration 80, loss = 0.0074
--- Epoch 826 / 1369 - 2459 epochs total
Iteration 0, loss = 0.0055
Iteration 20, loss = 0.0024
Iteration 40, loss = 0.0058
Iteration 60, loss = 0.0171
Iteration 80, loss = 0.0058
--- Epoch 827 / 1369 - 2460 epochs total
Iteration 0, loss = 0.0033
Iteration 20, loss = 0.0187
Iteration 40, loss = 0.0030
Iteration 60, loss = 0.0005
Iteration 80, loss = 0.0190
--- Epoch 828 / 1369 - 2461 epochs total
Iteration 0, loss = 0.0105
Iteration 20, loss = 0.0031
Iteration 40, loss = 0.0032
Iteration 60, loss = 0.0030
Iteration 80, loss = 0.0020
--- Epoch 829 / 1369 - 2462 epochs total
Iteration 0, loss = 0.0093
Iteration 20, loss = 0.0102
Iteration 40, loss = 0.0053
Iteration 60, loss = 0.0047
Iteration 80, loss = 0.0026
--- Epoch 830 / 1369 - 2463 epochs total
Iteration 0, loss = 0.0147
Iteration 20, loss = 0.0023
Iteration 40, loss = 0.0041
Iteration 60, loss = 0.0014
Iteration 80, loss = 0.0021
--- Epoch 831 / 1369 - 2464 epochs total
Iteration 0, loss = 0.0057
Iteration 20, loss = 0.0026
Iteration 40, loss = 0.0098
Iteration 60, loss = 0.0030
Iteration 80, loss = 0.0120
--- Epoch 832 / 1369 - 2465 epochs total
Iteration 0, loss = 0.0029
Iteration 20, loss = 0.0037
Iteration 40, loss = 0.0059
Iteration 60, loss = 0.0019
Iteration 80, loss = 0.0016
--- Epoch 833 / 1369 - 2466 epochs total
Iteration 0, loss = 0.0108
Iteration 20, loss = 0.0005
Iteration 40, loss = 0.0073
Iteration 60, loss = 0.0032
Iteration 80, loss = 0.0008
--- Epoch 834 / 1369 - 2467 epochs total
Iteration 0, loss = 0.0009
Iteration 20, loss = 0.0042
Iteration 40, loss = 0.0105
Iteration 60, loss = 0.0025
Iteration 80, loss = 0.0045
--- Epoch 835 / 1369 - 2468 epochs total
Iteration 0, loss = 0.0014
Iteration 20, loss = 0.0024
Iteration 40, loss = 0.0103
Iteration 60, loss = 0.0066
Iteration 80, loss = 0.0056
--- Epoch 836 / 1369 - 2469 epochs total
Iteration 0, loss = 0.0027
Iteration 20, loss = 0.0043
Iteration 40, loss = 0.0187
Iteration 60, loss = 0.0012
Iteration 80, loss = 0.0042
--- Epoch 837 / 1369 - 2470 epochs total
Iteration 0, loss = 0.0088
Iteration 20, loss = 0.0077
Iteration 40, loss = 0.0039
Iteration 60, loss = 0.0034
Iteration 80, loss = 0.0047
--- Epoch 838 / 1369 - 2471 epochs total
Iteration 0, loss = 0.0048
Iteration 20, loss = 0.0026
Iteration 40, loss = 0.0040
Iteration 60, loss = 0.0033
Iteration 80, loss = 0.0159
--- Epoch 839 / 1369 - 2472 epochs total
Iteration 0, loss = 0.0021
Iteration 20, loss = 0.0015
Iteration 40, loss = 0.0022
Iteration 60, loss = 0.0052
Iteration 80, loss = 0.0042
--- Epoch 840 / 1369 - 2473 epochs total
Iteration 0, loss = 0.0057
Iteration 20, loss = 0.0031
Iteration 40, loss = 0.0092
Iteration 60, loss = 0.0100
Iteration 80, loss = 0.0120
--- Epoch 841 / 1369 - 2474 epochs total
Iteration 0, loss = 0.0028
Iteration 20, loss = 0.0033
Iteration 40, loss = 0.0063
Iteration 60, loss = 0.0016
Iteration 80, loss = 0.0033
--- Epoch 842 / 1369 - 2475 epochs total
Iteration 0, loss = 0.0023
Iteration 20, loss = 0.0013
Iteration 40, loss = 0.0009
Iteration 60, loss = 0.0076
Iteration 80, loss = 0.0010
--- Epoch 843 / 1369 - 2476 epochs total
Iteration 0, loss = 0.0054
Iteration 20, loss = 0.0005
Iteration 40, loss = 0.0060
Iteration 60, loss = 0.0029
Iteration 80, loss = 0.0023
--- Epoch 844 / 1369 - 2477 epochs total
Iteration 0, loss = 0.0048
Iteration 20, loss = 0.0084
Iteration 40, loss = 0.0190
Iteration 60, loss = 0.0121
Iteration 80, loss = 0.0051
--- Epoch 845 / 1369 - 2478 epochs total
Iteration 0, loss = 0.0052
Iteration 20, loss = 0.0025
Iteration 40, loss = 0.0017
Iteration 60, loss = 0.0028
Iteration 80, loss = 0.0036
--- Epoch 846 / 1369 - 2479 epochs total
Iteration 0, loss = 0.0033
Iteration 20, loss = 0.0038
Iteration 40, loss = 0.0070
Iteration 60, loss = 0.0073
Iteration 80, loss = 0.0073
--- Epoch 847 / 1369 - 2480 epochs total
Iteration 0, loss = 0.0039
Iteration 20, loss = 0.0017
Iteration 40, loss = 0.0028
Iteration 60, loss = 0.0022
Iteration 80, loss = 0.0074
--- Epoch 848 / 1369 - 2481 epochs total
Iteration 0, loss = 0.0036
Iteration 20, loss = 0.0051
Iteration 40, loss = 0.0164
Iteration 60, loss = 0.0015
Iteration 80, loss = 0.0066
--- Epoch 849 / 1369 - 2482 epochs total
Iteration 0, loss = 0.0253
Iteration 20, loss = 0.0050
Iteration 40, loss = 0.0020
Iteration 60, loss = 0.0025
Iteration 80, loss = 0.0082
--- Epoch 850 / 1369 - 2483 epochs total
Iteration 0, loss = 0.0026
Iteration 20, loss = 0.0021
Iteration 40, loss = 0.0060
Iteration 60, loss = 0.0080
Iteration 80, loss = 0.0021
--- Epoch 851 / 1369 - 2484 epochs total
Iteration 0, loss = 0.0115
Iteration 20, loss = 0.0146
Iteration 40, loss = 0.0042
Iteration 60, loss = 0.0039
Iteration 80, loss = 0.0007
--- Epoch 852 / 1369 - 2485 epochs total
Iteration 0, loss = 0.0023
Iteration 20, loss = 0.0041
Iteration 40, loss = 0.0021
Iteration 60, loss = 0.0013
Iteration 80, loss = 0.0028
--- Epoch 853 / 1369 - 2486 epochs total
Iteration 0, loss = 0.0074
Iteration 20, loss = 0.0017
Iteration 40, loss = 0.0007
Iteration 60, loss = 0.0068
Iteration 80, loss = 0.0055
--- Epoch 854 / 1369 - 2487 epochs total
Iteration 0, loss = 0.0047
Iteration 20, loss = 0.0057
Iteration 40, loss = 0.0025
Iteration 60, loss = 0.0016
Iteration 80, loss = 0.0046
--- Epoch 855 / 1369 - 2488 epochs total
Iteration 0, loss = 0.0015
Iteration 20, loss = 0.0042
Iteration 40, loss = 0.0005
Iteration 60, loss = 0.0192
Iteration 80, loss = 0.0060
--- Epoch 856 / 1369 - 2489 epochs total
Iteration 0, loss = 0.0223
Iteration 20, loss = 0.0055
Iteration 40, loss = 0.0018
Iteration 60, loss = 0.0109
Iteration 80, loss = 0.0017
--- Epoch 857 / 1369 - 2490 epochs total
Iteration 0, loss = 0.0064
Iteration 20, loss = 0.0071
Iteration 40, loss = 0.0041
Iteration 60, loss = 0.0069
Iteration 80, loss = 0.0219
--- Epoch 858 / 1369 - 2491 epochs total
Iteration 0, loss = 0.0062
Iteration 20, loss = 0.0085
Iteration 40, loss = 0.0030
Iteration 60, loss = 0.0062
Iteration 80, loss = 0.0146
--- Epoch 859 / 1369 - 2492 epochs total
Iteration 0, loss = 0.0021
Iteration 20, loss = 0.0098
Iteration 40, loss = 0.0027
Iteration 60, loss = 0.0046
Iteration 80, loss = 0.0014
--- Epoch 860 / 1369 - 2493 epochs total
Iteration 0, loss = 0.0037
Iteration 20, loss = 0.0072
Iteration 40, loss = 0.0057
Iteration 60, loss = 0.0038
Iteration 80, loss = 0.0012
--- Epoch 861 / 1369 - 2494 epochs total
Iteration 0, loss = 0.0049
Iteration 20, loss = 0.0020
Iteration 40, loss = 0.0059
Iteration 60, loss = 0.0033
Iteration 80, loss = 0.0280
--- Epoch 862 / 1369 - 2495 epochs total
Iteration 0, loss = 0.0048
Iteration 20, loss = 0.0058
Iteration 40, loss = 0.0054
Iteration 60, loss = 0.0058
Iteration 80, loss = 0.0016
--- Epoch 863 / 1369 - 2496 epochs total
Iteration 0, loss = 0.0029
Iteration 20, loss = 0.0016
Iteration 40, loss = 0.0025
Iteration 60, loss = 0.0097
Iteration 80, loss = 0.0020
--- Epoch 864 / 1369 - 2497 epochs total
Iteration 0, loss = 0.0044
Iteration 20, loss = 0.0070
Iteration 40, loss = 0.0021
Iteration 60, loss = 0.0014
Iteration 80, loss = 0.0032
--- Epoch 865 / 1369 - 2498 epochs total
Iteration 0, loss = 0.0013
Iteration 20, loss = 0.0022
Iteration 40, loss = 0.0087
Iteration 60, loss = 0.0011
Iteration 80, loss = 0.0034
--- Epoch 866 / 1369 - 2499 epochs total
Iteration 0, loss = 0.0040
Iteration 20, loss = 0.0076
Iteration 40, loss = 0.0095
Iteration 60, loss = 0.0025
Iteration 80, loss = 0.0036
--- Epoch 867 / 1369 - 2500 epochs total
Iteration 0, loss = 0.0133
Iteration 20, loss = 0.0043
Iteration 40, loss = 0.0400
Iteration 60, loss = 0.0026
Iteration 80, loss = 0.0047
--- Epoch 868 / 1369 - 2501 epochs total
Iteration 0, loss = 0.0031
Iteration 20, loss = 0.0037
Iteration 40, loss = 0.0100
Iteration 60, loss = 0.0021
Iteration 80, loss = 0.0500
--- Epoch 869 / 1369 - 2502 epochs total
Iteration 0, loss = 0.0069
Iteration 20, loss = 0.0051
Iteration 40, loss = 0.0067
Iteration 60, loss = 0.0019
Iteration 80, loss = 0.0020
--- Epoch 870 / 1369 - 2503 epochs total
Iteration 0, loss = 0.0044
Iteration 20, loss = 0.0067
Iteration 40, loss = 0.0058
Iteration 60, loss = 0.0016
Iteration 80, loss = 0.0020
--- Epoch 871 / 1369 - 2504 epochs total
Iteration 0, loss = 0.0027
Iteration 20, loss = 0.0039
Iteration 40, loss = 0.0014
Iteration 60, loss = 0.0056
Iteration 80, loss = 0.0122
--- Epoch 872 / 1369 - 2505 epochs total
Iteration 0, loss = 0.0028
Iteration 20, loss = 0.0035
Iteration 40, loss = 0.0035
Iteration 60, loss = 0.0029
Iteration 80, loss = 0.0035
--- Epoch 873 / 1369 - 2506 epochs total
Iteration 0, loss = 0.0049
Iteration 20, loss = 0.0007
Iteration 40, loss = 0.0045
Iteration 60, loss = 0.0014
Iteration 80, loss = 0.0012
--- Epoch 874 / 1369 - 2507 epochs total
Iteration 0, loss = 0.0147
Iteration 20, loss = 0.0019
Iteration 40, loss = 0.0036
Iteration 60, loss = 0.0044
Iteration 80, loss = 0.0078
--- Epoch 875 / 1369 - 2508 epochs total
Iteration 0, loss = 0.0055
Iteration 20, loss = 0.0152
Iteration 40, loss = 0.0025
Iteration 60, loss = 0.0037
Iteration 80, loss = 0.0007
--- Epoch 876 / 1369 - 2509 epochs total
Iteration 0, loss = 0.0068
Iteration 20, loss = 0.0035
Iteration 40, loss = 0.0029
Iteration 60, loss = 0.0035
Iteration 80, loss = 0.0022
--- Epoch 877 / 1369 - 2510 epochs total
Iteration 0, loss = 0.0190
Iteration 20, loss = 0.0058
Iteration 40, loss = 0.0089
Iteration 60, loss = 0.0027
Iteration 80, loss = 0.0014
--- Epoch 878 / 1369 - 2511 epochs total
Iteration 0, loss = 0.0129
Iteration 20, loss = 0.0039
Iteration 40, loss = 0.0068
Iteration 60, loss = 0.0039
Iteration 80, loss = 0.0059
--- Epoch 879 / 1369 - 2512 epochs total
Iteration 0, loss = 0.0010
Iteration 20, loss = 0.0050
Iteration 40, loss = 0.0026
Iteration 60, loss = 0.0023
Iteration 80, loss = 0.0059
--- Epoch 880 / 1369 - 2513 epochs total
Iteration 0, loss = 0.0046
Iteration 20, loss = 0.0170
Iteration 40, loss = 0.0020
Iteration 60, loss = 0.0047
Iteration 80, loss = 0.0022
--- Epoch 881 / 1369 - 2514 epochs total
Iteration 0, loss = 0.0024
Iteration 20, loss = 0.0050
Iteration 40, loss = 0.0016
Iteration 60, loss = 0.0035
Iteration 80, loss = 0.0019
--- Epoch 882 / 1369 - 2515 epochs total
Iteration 0, loss = 0.0008
Iteration 20, loss = 0.0113
Iteration 40, loss = 0.0107
Iteration 60, loss = 0.0043
Iteration 80, loss = 0.0049
--- Epoch 883 / 1369 - 2516 epochs total
Iteration 0, loss = 0.0028
Iteration 20, loss = 0.0025
Iteration 40, loss = 0.0071
Iteration 60, loss = 0.0076
Iteration 80, loss = 0.0121
--- Epoch 884 / 1369 - 2517 epochs total
Iteration 0, loss = 0.0047
Iteration 20, loss = 0.0112
Iteration 40, loss = 0.0097
Iteration 60, loss = 0.0054
Iteration 80, loss = 0.0027
--- Epoch 885 / 1369 - 2518 epochs total
Iteration 0, loss = 0.0044
Iteration 20, loss = 0.0046
Iteration 40, loss = 0.0110
Iteration 60, loss = 0.0149
Iteration 80, loss = 0.0015
--- Epoch 886 / 1369 - 2519 epochs total
Iteration 0, loss = 0.0052
Iteration 20, loss = 0.0023
Iteration 40, loss = 0.0011
Iteration 60, loss = 0.0032
Iteration 80, loss = 0.0049
--- Epoch 887 / 1369 - 2520 epochs total
Iteration 0, loss = 0.0014
Iteration 20, loss = 0.0015
Iteration 40, loss = 0.0010
Iteration 60, loss = 0.0007
Iteration 80, loss = 0.0013
--- Epoch 888 / 1369 - 2521 epochs total
Iteration 0, loss = 0.0081
Iteration 20, loss = 0.0056
Iteration 40, loss = 0.0016
Iteration 60, loss = 0.0038
Iteration 80, loss = 0.0101
--- Epoch 889 / 1369 - 2522 epochs total
Iteration 0, loss = 0.0033
Iteration 20, loss = 0.0018
Iteration 40, loss = 0.0035
Iteration 60, loss = 0.0010
Iteration 80, loss = 0.0020
--- Epoch 890 / 1369 - 2523 epochs total
Iteration 0, loss = 0.0027
Iteration 20, loss = 0.0054
Iteration 40, loss = 0.0048
Iteration 60, loss = 0.0027
Iteration 80, loss = 0.0059
--- Epoch 891 / 1369 - 2524 epochs total
Iteration 0, loss = 0.0027
Iteration 20, loss = 0.0067
Iteration 40, loss = 0.0029
Iteration 60, loss = 0.0063
Iteration 80, loss = 0.0029
--- Epoch 892 / 1369 - 2525 epochs total
Iteration 0, loss = 0.0036
Iteration 20, loss = 0.0020
Iteration 40, loss = 0.0046
Iteration 60, loss = 0.0017
Iteration 80, loss = 0.0018
--- Epoch 893 / 1369 - 2526 epochs total
Iteration 0, loss = 0.0047
Iteration 20, loss = 0.0126
Iteration 40, loss = 0.0043
Iteration 60, loss = 0.0015
Iteration 80, loss = 0.0027
--- Epoch 894 / 1369 - 2527 epochs total
Iteration 0, loss = 0.0058
Iteration 20, loss = 0.0031
Iteration 40, loss = 0.0037
Iteration 60, loss = 0.0022
Iteration 80, loss = 0.0039
--- Epoch 895 / 1369 - 2528 epochs total
Iteration 0, loss = 0.0050
Iteration 20, loss = 0.0041
Iteration 40, loss = 0.0237
Iteration 60, loss = 0.0184
Iteration 80, loss = 0.0059
--- Epoch 896 / 1369 - 2529 epochs total
Iteration 0, loss = 0.0045
Iteration 20, loss = 0.0058
Iteration 40, loss = 0.0065
Iteration 60, loss = 0.0050
Iteration 80, loss = 0.0035
--- Epoch 897 / 1369 - 2530 epochs total
Iteration 0, loss = 0.0015
Iteration 20, loss = 0.0072
Iteration 40, loss = 0.0015
Iteration 60, loss = 0.0027
Iteration 80, loss = 0.0010
--- Epoch 898 / 1369 - 2531 epochs total
Iteration 0, loss = 0.0036
Iteration 20, loss = 0.0029
Iteration 40, loss = 0.0036
Iteration 60, loss = 0.0019
Iteration 80, loss = 0.0013
--- Epoch 899 / 1369 - 2532 epochs total
Iteration 0, loss = 0.0079
Iteration 20, loss = 0.0034
Iteration 40, loss = 0.0375
Iteration 60, loss = 0.0037
Iteration 80, loss = 0.0005
--- Epoch 900 / 1369 - 2533 epochs total
Iteration 0, loss = 0.0076
Iteration 20, loss = 0.0089
Iteration 40, loss = 0.0119
Iteration 60, loss = 0.0016
Iteration 80, loss = 0.0031
--- Epoch 901 / 1369 - 2534 epochs total
Iteration 0, loss = 0.0022
Iteration 20, loss = 0.0015
Iteration 40, loss = 0.0047
Iteration 60, loss = 0.0022
Iteration 80, loss = 0.0013
--- Epoch 902 / 1369 - 2535 epochs total
Iteration 0, loss = 0.0025
Iteration 20, loss = 0.0232
Iteration 40, loss = 0.0018
Iteration 60, loss = 0.0081
Iteration 80, loss = 0.0135
--- Epoch 903 / 1369 - 2536 epochs total
Iteration 0, loss = 0.0022
Iteration 20, loss = 0.0127
Iteration 40, loss = 0.0094
Iteration 60, loss = 0.0139
Iteration 80, loss = 0.0083
--- Epoch 904 / 1369 - 2537 epochs total
Iteration 0, loss = 0.0226
Iteration 20, loss = 0.0410
Iteration 40, loss = 0.0061
Iteration 60, loss = 0.0018
Iteration 80, loss = 0.0121
--- Epoch 905 / 1369 - 2538 epochs total
Iteration 0, loss = 0.0050
Iteration 20, loss = 0.0052
Iteration 40, loss = 0.0023
Iteration 60, loss = 0.0453
Iteration 80, loss = 0.0031
--- Epoch 906 / 1369 - 2539 epochs total
Iteration 0, loss = 0.0310
Iteration 20, loss = 0.0035
Iteration 40, loss = 0.0033
Iteration 60, loss = 0.0066
Iteration 80, loss = 0.0033
--- Epoch 907 / 1369 - 2540 epochs total
Iteration 0, loss = 0.0040
Iteration 20, loss = 0.0030
Iteration 40, loss = 0.0024
Iteration 60, loss = 0.0126
Iteration 80, loss = 0.0048
--- Epoch 908 / 1369 - 2541 epochs total
Iteration 0, loss = 0.0036
Iteration 20, loss = 0.0053
Iteration 40, loss = 0.0134
Iteration 60, loss = 0.0026
Iteration 80, loss = 0.0017
--- Epoch 909 / 1369 - 2542 epochs total
Iteration 0, loss = 0.0052
Iteration 20, loss = 0.0030
Iteration 40, loss = 0.0049
Iteration 60, loss = 0.0037
Iteration 80, loss = 0.0021
--- Epoch 910 / 1369 - 2543 epochs total
Iteration 0, loss = 0.0011
Iteration 20, loss = 0.0014
Iteration 40, loss = 0.0020
Iteration 60, loss = 0.0030
Iteration 80, loss = 0.0127
--- Epoch 911 / 1369 - 2544 epochs total
Iteration 0, loss = 0.0047
Iteration 20, loss = 0.0064
Iteration 40, loss = 0.0047
Iteration 60, loss = 0.0049
Iteration 80, loss = 0.0029
--- Epoch 912 / 1369 - 2545 epochs total
Iteration 0, loss = 0.0020
Iteration 20, loss = 0.0054
Iteration 40, loss = 0.0015
Iteration 60, loss = 0.0054
Iteration 80, loss = 0.0005
--- Epoch 913 / 1369 - 2546 epochs total
Iteration 0, loss = 0.0042
Iteration 20, loss = 0.0033
Iteration 40, loss = 0.0017
Iteration 60, loss = 0.0129
Iteration 80, loss = 0.0014
--- Epoch 914 / 1369 - 2547 epochs total
Iteration 0, loss = 0.0054
Iteration 20, loss = 0.0006
Iteration 40, loss = 0.0021
Iteration 60, loss = 0.0077
Iteration 80, loss = 0.0058
--- Epoch 915 / 1369 - 2548 epochs total
Iteration 0, loss = 0.0139
Iteration 20, loss = 0.0016
Iteration 40, loss = 0.0029
Iteration 60, loss = 0.0009
Iteration 80, loss = 0.0044
--- Epoch 916 / 1369 - 2549 epochs total
Iteration 0, loss = 0.0055
Iteration 20, loss = 0.0025
Iteration 40, loss = 0.0075
Iteration 60, loss = 0.0062
Iteration 80, loss = 0.0025
--- Epoch 917 / 1369 - 2550 epochs total
Iteration 0, loss = 0.0028
Iteration 20, loss = 0.0089
Iteration 40, loss = 0.0100
Iteration 60, loss = 0.0039
Iteration 80, loss = 0.0119
--- Epoch 918 / 1369 - 2551 epochs total
Iteration 0, loss = 0.0015
Iteration 20, loss = 0.0015
Iteration 40, loss = 0.0021
Iteration 60, loss = 0.0015
Iteration 80, loss = 0.0043
--- Epoch 919 / 1369 - 2552 epochs total
Iteration 0, loss = 0.0047
Iteration 20, loss = 0.0064
Iteration 40, loss = 0.0032
Iteration 60, loss = 0.0048
Iteration 80, loss = 0.0073
--- Epoch 920 / 1369 - 2553 epochs total
Iteration 0, loss = 0.0106
Iteration 20, loss = 0.0045
Iteration 40, loss = 0.0071
Iteration 60, loss = 0.0029
Iteration 80, loss = 0.0028
--- Epoch 921 / 1369 - 2554 epochs total
Iteration 0, loss = 0.0020
Iteration 20, loss = 0.0159
Iteration 40, loss = 0.0256
Iteration 60, loss = 0.0072
Iteration 80, loss = 0.0014
--- Epoch 922 / 1369 - 2555 epochs total
Iteration 0, loss = 0.0009
Iteration 20, loss = 0.0086
Iteration 40, loss = 0.0116
Iteration 60, loss = 0.0045
Iteration 80, loss = 0.0048
--- Epoch 923 / 1369 - 2556 epochs total
Iteration 0, loss = 0.0035
Iteration 20, loss = 0.0054
Iteration 40, loss = 0.0021
Iteration 60, loss = 0.0092
Iteration 80, loss = 0.0046
--- Epoch 924 / 1369 - 2557 epochs total
Iteration 0, loss = 0.0014
Iteration 20, loss = 0.0052
Iteration 40, loss = 0.0057
Iteration 60, loss = 0.0014
Iteration 80, loss = 0.0027
--- Epoch 925 / 1369 - 2558 epochs total
Iteration 0, loss = 0.0017
Iteration 20, loss = 0.0042
Iteration 40, loss = 0.0050
Iteration 60, loss = 0.0051
Iteration 80, loss = 0.0025
--- Epoch 926 / 1369 - 2559 epochs total
Iteration 0, loss = 0.0017
Iteration 20, loss = 0.0038
Iteration 40, loss = 0.0032
Iteration 60, loss = 0.0038
Iteration 80, loss = 0.0064
--- Epoch 927 / 1369 - 2560 epochs total
Iteration 0, loss = 0.0068
Iteration 20, loss = 0.0042
Iteration 40, loss = 0.0046
Iteration 60, loss = 0.0024
Iteration 80, loss = 0.0048
--- Epoch 928 / 1369 - 2561 epochs total
Iteration 0, loss = 0.0010
Iteration 20, loss = 0.0053
Iteration 40, loss = 0.0023
Iteration 60, loss = 0.0057
Iteration 80, loss = 0.0012
--- Epoch 929 / 1369 - 2562 epochs total
Iteration 0, loss = 0.0009
Iteration 20, loss = 0.0025
Iteration 40, loss = 0.0027
Iteration 60, loss = 0.0093
Iteration 80, loss = 0.0023
--- Epoch 930 / 1369 - 2563 epochs total
Iteration 0, loss = 0.0024
Iteration 20, loss = 0.0035
Iteration 40, loss = 0.0048
Iteration 60, loss = 0.0039
Iteration 80, loss = 0.0029
--- Epoch 931 / 1369 - 2564 epochs total
Iteration 0, loss = 0.0037
Iteration 20, loss = 0.0194
Iteration 40, loss = 0.0080
Iteration 60, loss = 0.0128
Iteration 80, loss = 0.0051
--- Epoch 932 / 1369 - 2565 epochs total
Iteration 0, loss = 0.0050
Iteration 20, loss = 0.0028
Iteration 40, loss = 0.0013
Iteration 60, loss = 0.0027
Iteration 80, loss = 0.0143
--- Epoch 933 / 1369 - 2566 epochs total
Iteration 0, loss = 0.0111
Iteration 20, loss = 0.0021
Iteration 40, loss = 0.0085
Iteration 60, loss = 0.0088
Iteration 80, loss = 0.0034
--- Epoch 934 / 1369 - 2567 epochs total
Iteration 0, loss = 0.0042
Iteration 20, loss = 0.0053
Iteration 40, loss = 0.0041
Iteration 60, loss = 0.0378
Iteration 80, loss = 0.0055
--- Epoch 935 / 1369 - 2568 epochs total
Iteration 0, loss = 0.0046
Iteration 20, loss = 0.0019
Iteration 40, loss = 0.0025
Iteration 60, loss = 0.0057
Iteration 80, loss = 0.0024
--- Epoch 936 / 1369 - 2569 epochs total
Iteration 0, loss = 0.0045
Iteration 20, loss = 0.0157
Iteration 40, loss = 0.0032
Iteration 60, loss = 0.0016
Iteration 80, loss = 0.0024
--- Epoch 937 / 1369 - 2570 epochs total
Iteration 0, loss = 0.0021
Iteration 20, loss = 0.0078
Iteration 40, loss = 0.0016
Iteration 60, loss = 0.0045
Iteration 80, loss = 0.0075
--- Epoch 938 / 1369 - 2571 epochs total
Iteration 0, loss = 0.0039
Iteration 20, loss = 0.0080
Iteration 40, loss = 0.0063
Iteration 60, loss = 0.0033
Iteration 80, loss = 0.0036
--- Epoch 939 / 1369 - 2572 epochs total
Iteration 0, loss = 0.0044
Iteration 20, loss = 0.0046
Iteration 40, loss = 0.0015
Iteration 60, loss = 0.0165
Iteration 80, loss = 0.0115
--- Epoch 940 / 1369 - 2573 epochs total
Iteration 0, loss = 0.0031
Iteration 20, loss = 0.0073
Iteration 40, loss = 0.0192
Iteration 60, loss = 0.0034
Iteration 80, loss = 0.0032
--- Epoch 941 / 1369 - 2574 epochs total
Iteration 0, loss = 0.0050
Iteration 20, loss = 0.0013
Iteration 40, loss = 0.0039
Iteration 60, loss = 0.0019
Iteration 80, loss = 0.0083
--- Epoch 942 / 1369 - 2575 epochs total
Iteration 0, loss = 0.0040
Iteration 20, loss = 0.0222
Iteration 40, loss = 0.0021
Iteration 60, loss = 0.0022
Iteration 80, loss = 0.0036
--- Epoch 943 / 1369 - 2576 epochs total
Iteration 0, loss = 0.0024
Iteration 20, loss = 0.0026
Iteration 40, loss = 0.0018
Iteration 60, loss = 0.0024
Iteration 80, loss = 0.0015
--- Epoch 944 / 1369 - 2577 epochs total
Iteration 0, loss = 0.0181
Iteration 20, loss = 0.0060
Iteration 40, loss = 0.0017
Iteration 60, loss = 0.0019
Iteration 80, loss = 0.0016
--- Epoch 945 / 1369 - 2578 epochs total
Iteration 0, loss = 0.0056
Iteration 20, loss = 0.0080
Iteration 40, loss = 0.0122
Iteration 60, loss = 0.0016
Iteration 80, loss = 0.0018
--- Epoch 946 / 1369 - 2579 epochs total
Iteration 0, loss = 0.0023
Iteration 20, loss = 0.0035
Iteration 40, loss = 0.0063
Iteration 60, loss = 0.0029
Iteration 80, loss = 0.0077
--- Epoch 947 / 1369 - 2580 epochs total
Iteration 0, loss = 0.0032
Iteration 20, loss = 0.0084
Iteration 40, loss = 0.0023
Iteration 60, loss = 0.0023
Iteration 80, loss = 0.0093
--- Epoch 948 / 1369 - 2581 epochs total
Iteration 0, loss = 0.0022
Iteration 20, loss = 0.0018
Iteration 40, loss = 0.0020
Iteration 60, loss = 0.0091
Iteration 80, loss = 0.0008
--- Epoch 949 / 1369 - 2582 epochs total
Iteration 0, loss = 0.0012
Iteration 20, loss = 0.0095
Iteration 40, loss = 0.0077
Iteration 60, loss = 0.0046
Iteration 80, loss = 0.0094
--- Epoch 950 / 1369 - 2583 epochs total
Iteration 0, loss = 0.0046
Iteration 20, loss = 0.0054
Iteration 40, loss = 0.0035
Iteration 60, loss = 0.0019
Iteration 80, loss = 0.0033
--- Epoch 951 / 1369 - 2584 epochs total
Iteration 0, loss = 0.0048
Iteration 20, loss = 0.0028
Iteration 40, loss = 0.0110
Iteration 60, loss = 0.0023
Iteration 80, loss = 0.0128
--- Epoch 952 / 1369 - 2585 epochs total
Iteration 0, loss = 0.0070
Iteration 20, loss = 0.0021
Iteration 40, loss = 0.0021
Iteration 60, loss = 0.0010
Iteration 80, loss = 0.0021
--- Epoch 953 / 1369 - 2586 epochs total
Iteration 0, loss = 0.0020
Iteration 20, loss = 0.0023
Iteration 40, loss = 0.0023
Iteration 60, loss = 0.0034
Iteration 80, loss = 0.0015
--- Epoch 954 / 1369 - 2587 epochs total
Iteration 0, loss = 0.0057
Iteration 20, loss = 0.0024
Iteration 40, loss = 0.0041
Iteration 60, loss = 0.0034
Iteration 80, loss = 0.0026
--- Epoch 955 / 1369 - 2588 epochs total
Iteration 0, loss = 0.0018
Iteration 20, loss = 0.0129
Iteration 40, loss = 0.0333
Iteration 60, loss = 0.0036
Iteration 80, loss = 0.0121
--- Epoch 956 / 1369 - 2589 epochs total
Iteration 0, loss = 0.0034
Iteration 20, loss = 0.0019
Iteration 40, loss = 0.0044
Iteration 60, loss = 0.0020
Iteration 80, loss = 0.0111
--- Epoch 957 / 1369 - 2590 epochs total
Iteration 0, loss = 0.0106
Iteration 20, loss = 0.0032
Iteration 40, loss = 0.0026
Iteration 60, loss = 0.0053
Iteration 80, loss = 0.0070
--- Epoch 958 / 1369 - 2591 epochs total
Iteration 0, loss = 0.0095
Iteration 20, loss = 0.0062
Iteration 40, loss = 0.0040
Iteration 60, loss = 0.0018
Iteration 80, loss = 0.0084
--- Epoch 959 / 1369 - 2592 epochs total
Iteration 0, loss = 0.0016
Iteration 20, loss = 0.0022
Iteration 40, loss = 0.0067
Iteration 60, loss = 0.0103
Iteration 80, loss = 0.0011
--- Epoch 960 / 1369 - 2593 epochs total
Iteration 0, loss = 0.0014
Iteration 20, loss = 0.0026
Iteration 40, loss = 0.0033
Iteration 60, loss = 0.0050
Iteration 80, loss = 0.0062
--- Epoch 961 / 1369 - 2594 epochs total
Iteration 0, loss = 0.0057
Iteration 20, loss = 0.0021
Iteration 40, loss = 0.0045
Iteration 60, loss = 0.0004
Iteration 80, loss = 0.0038
--- Epoch 962 / 1369 - 2595 epochs total
Iteration 0, loss = 0.0068
Iteration 20, loss = 0.0100
Iteration 40, loss = 0.0040
Iteration 60, loss = 0.0046
Iteration 80, loss = 0.0075
--- Epoch 963 / 1369 - 2596 epochs total
Iteration 0, loss = 0.0053
Iteration 20, loss = 0.0064
Iteration 40, loss = 0.0039
Iteration 60, loss = 0.0049
Iteration 80, loss = 0.0041
--- Epoch 964 / 1369 - 2597 epochs total
Iteration 0, loss = 0.0018
Iteration 20, loss = 0.0034
Iteration 40, loss = 0.0077
Iteration 60, loss = 0.0029
Iteration 80, loss = 0.0061
--- Epoch 965 / 1369 - 2598 epochs total
Iteration 0, loss = 0.0022
Iteration 20, loss = 0.0020
Iteration 40, loss = 0.0026
Iteration 60, loss = 0.0021
Iteration 80, loss = 0.0025
--- Epoch 966 / 1369 - 2599 epochs total
Iteration 0, loss = 0.0032
Iteration 20, loss = 0.0021
Iteration 40, loss = 0.0027
Iteration 60, loss = 0.0050
Iteration 80, loss = 0.0063
--- Epoch 967 / 1369 - 2600 epochs total
Iteration 0, loss = 0.0055
Iteration 20, loss = 0.0081
Iteration 40, loss = 0.0038
Iteration 60, loss = 0.0026
Iteration 80, loss = 0.0096
--- Epoch 968 / 1369 - 2601 epochs total
Iteration 0, loss = 0.0013
Iteration 20, loss = 0.0009
Iteration 40, loss = 0.0120
Iteration 60, loss = 0.0079
Iteration 80, loss = 0.0020
--- Epoch 969 / 1369 - 2602 epochs total
Iteration 0, loss = 0.0191
Iteration 20, loss = 0.0048
Iteration 40, loss = 0.0007
Iteration 60, loss = 0.0057
Iteration 80, loss = 0.0185
--- Epoch 970 / 1369 - 2603 epochs total
Iteration 0, loss = 0.0018
Iteration 20, loss = 0.0020
Iteration 40, loss = 0.0053
Iteration 60, loss = 0.0014
Iteration 80, loss = 0.0013
--- Epoch 971 / 1369 - 2604 epochs total
Iteration 0, loss = 0.0040
Iteration 20, loss = 0.0016
Iteration 40, loss = 0.0045
Iteration 60, loss = 0.0015
Iteration 80, loss = 0.0040
--- Epoch 972 / 1369 - 2605 epochs total
Iteration 0, loss = 0.0019
Iteration 20, loss = 0.0028
Iteration 40, loss = 0.0237
Iteration 60, loss = 0.0023
Iteration 80, loss = 0.0070
--- Epoch 973 / 1369 - 2606 epochs total
Iteration 0, loss = 0.0045
Iteration 20, loss = 0.0034
Iteration 40, loss = 0.0058
Iteration 60, loss = 0.0078
Iteration 80, loss = 0.0032
--- Epoch 974 / 1369 - 2607 epochs total
Iteration 0, loss = 0.0121
Iteration 20, loss = 0.0076
Iteration 40, loss = 0.0024
Iteration 60, loss = 0.0122
Iteration 80, loss = 0.0022
--- Epoch 975 / 1369 - 2608 epochs total
Iteration 0, loss = 0.0021
Iteration 20, loss = 0.0033
Iteration 40, loss = 0.0041
Iteration 60, loss = 0.0030
Iteration 80, loss = 0.0018
--- Epoch 976 / 1369 - 2609 epochs total
Iteration 0, loss = 0.0300
Iteration 20, loss = 0.0048
Iteration 40, loss = 0.0028
Iteration 60, loss = 0.0034
Iteration 80, loss = 0.0035
--- Epoch 977 / 1369 - 2610 epochs total
Iteration 0, loss = 0.0072
Iteration 20, loss = 0.0108
Iteration 40, loss = 0.0016
Iteration 60, loss = 0.0037
Iteration 80, loss = 0.0094
--- Epoch 978 / 1369 - 2611 epochs total
Iteration 0, loss = 0.0006
Iteration 20, loss = 0.0019
Iteration 40, loss = 0.0123
Iteration 60, loss = 0.0036
Iteration 80, loss = 0.0021
--- Epoch 979 / 1369 - 2612 epochs total
Iteration 0, loss = 0.0007
Iteration 20, loss = 0.0054
Iteration 40, loss = 0.0067
Iteration 60, loss = 0.0033
Iteration 80, loss = 0.0007
--- Epoch 980 / 1369 - 2613 epochs total
Iteration 0, loss = 0.0059
Iteration 20, loss = 0.0035
Iteration 40, loss = 0.0022
Iteration 60, loss = 0.0008
Iteration 80, loss = 0.0062
--- Epoch 981 / 1369 - 2614 epochs total
Iteration 0, loss = 0.0035
Iteration 20, loss = 0.0126
Iteration 40, loss = 0.0008
Iteration 60, loss = 0.0040
Iteration 80, loss = 0.0242
--- Epoch 982 / 1369 - 2615 epochs total
Iteration 0, loss = 0.0013
Iteration 20, loss = 0.0177
Iteration 40, loss = 0.0039
Iteration 60, loss = 0.0032
Iteration 80, loss = 0.0050
--- Epoch 983 / 1369 - 2616 epochs total
Iteration 0, loss = 0.0028
Iteration 20, loss = 0.0034
Iteration 40, loss = 0.0025
Iteration 60, loss = 0.0147
Iteration 80, loss = 0.0026
--- Epoch 984 / 1369 - 2617 epochs total
Iteration 0, loss = 0.0028
Iteration 20, loss = 0.0027
Iteration 40, loss = 0.0080
Iteration 60, loss = 0.0071
Iteration 80, loss = 0.0042
--- Epoch 985 / 1369 - 2618 epochs total
Iteration 0, loss = 0.0052
Iteration 20, loss = 0.0024
Iteration 40, loss = 0.0010
Iteration 60, loss = 0.0028
Iteration 80, loss = 0.0031
--- Epoch 986 / 1369 - 2619 epochs total
Iteration 0, loss = 0.0071
Iteration 20, loss = 0.0023
Iteration 40, loss = 0.0015
Iteration 60, loss = 0.0021
Iteration 80, loss = 0.0061
--- Epoch 987 / 1369 - 2620 epochs total
Iteration 0, loss = 0.0037
Iteration 20, loss = 0.0202
Iteration 40, loss = 0.0027
Iteration 60, loss = 0.0037
Iteration 80, loss = 0.0030
--- Epoch 988 / 1369 - 2621 epochs total
Iteration 0, loss = 0.0069
Iteration 20, loss = 0.0040
Iteration 40, loss = 0.0093
Iteration 60, loss = 0.0023
Iteration 80, loss = 0.0053
--- Epoch 989 / 1369 - 2622 epochs total
Iteration 0, loss = 0.0030
Iteration 20, loss = 0.0043
Iteration 40, loss = 0.0007
Iteration 60, loss = 0.0036
Iteration 80, loss = 0.0014
--- Epoch 990 / 1369 - 2623 epochs total
Iteration 0, loss = 0.0019
Iteration 20, loss = 0.0078
Iteration 40, loss = 0.0029
Iteration 60, loss = 0.0155
Iteration 80, loss = 0.0030
--- Epoch 991 / 1369 - 2624 epochs total
Iteration 0, loss = 0.0040
Iteration 20, loss = 0.0206
Iteration 40, loss = 0.0078
Iteration 60, loss = 0.0029
Iteration 80, loss = 0.0026
--- Epoch 992 / 1369 - 2625 epochs total
Iteration 0, loss = 0.0009
Iteration 20, loss = 0.0014
Iteration 40, loss = 0.0010
Iteration 60, loss = 0.0062
Iteration 80, loss = 0.0016
--- Epoch 993 / 1369 - 2626 epochs total
Iteration 0, loss = 0.0024
Iteration 20, loss = 0.0073
Iteration 40, loss = 0.0016
Iteration 60, loss = 0.0015
Iteration 80, loss = 0.0059
--- Epoch 994 / 1369 - 2627 epochs total
Iteration 0, loss = 0.0044
Iteration 20, loss = 0.0025
Iteration 40, loss = 0.0101
Iteration 60, loss = 0.0174
Iteration 80, loss = 0.0009
--- Epoch 995 / 1369 - 2628 epochs total
Iteration 0, loss = 0.0012
Iteration 20, loss = 0.0093
Iteration 40, loss = 0.0017
Iteration 60, loss = 0.0010
Iteration 80, loss = 0.0036
--- Epoch 996 / 1369 - 2629 epochs total
Iteration 0, loss = 0.0026
Iteration 20, loss = 0.0039
Iteration 40, loss = 0.0073
Iteration 60, loss = 0.0051
Iteration 80, loss = 0.0014
--- Epoch 997 / 1369 - 2630 epochs total
Iteration 0, loss = 0.0040
Iteration 20, loss = 0.0011
Iteration 40, loss = 0.0059
Iteration 60, loss = 0.0091
Iteration 80, loss = 0.0070
--- Epoch 998 / 1369 - 2631 epochs total
Iteration 0, loss = 0.0037
Iteration 20, loss = 0.0058
Iteration 40, loss = 0.0032
Iteration 60, loss = 0.0014
Iteration 80, loss = 0.0042
--- Epoch 999 / 1369 - 2632 epochs total
Iteration 0, loss = 0.0079
Iteration 20, loss = 0.0011
Iteration 40, loss = 0.0058
Iteration 60, loss = 0.0022
Iteration 80, loss = 0.0035
--- Epoch 1000 / 1369 - 2633 epochs total
Iteration 0, loss = 0.0023
Iteration 20, loss = 0.0142
Iteration 40, loss = 0.0019
Iteration 60, loss = 0.0071
Iteration 80, loss = 0.0062
--- Epoch 1001 / 1369 - 2634 epochs total
Iteration 0, loss = 0.0017
Iteration 20, loss = 0.0066
Iteration 40, loss = 0.0210
Iteration 60, loss = 0.0059
Iteration 80, loss = 0.0010
--- Epoch 1002 / 1369 - 2635 epochs total
Iteration 0, loss = 0.0058
Iteration 20, loss = 0.0032
Iteration 40, loss = 0.0071
Iteration 60, loss = 0.0070
Iteration 80, loss = 0.0028
--- Epoch 1003 / 1369 - 2636 epochs total
Iteration 0, loss = 0.0028
Iteration 20, loss = 0.0014
Iteration 40, loss = 0.0029
Iteration 60, loss = 0.0018
Iteration 80, loss = 0.0035
--- Epoch 1004 / 1369 - 2637 epochs total
Iteration 0, loss = 0.0028
Iteration 20, loss = 0.0051
Iteration 40, loss = 0.0038
Iteration 60, loss = 0.0034
Iteration 80, loss = 0.0020
--- Epoch 1005 / 1369 - 2638 epochs total
Iteration 0, loss = 0.0031
Iteration 20, loss = 0.0021
Iteration 40, loss = 0.0072
Iteration 60, loss = 0.0048
Iteration 80, loss = 0.0076
--- Epoch 1006 / 1369 - 2639 epochs total
Iteration 0, loss = 0.0034
Iteration 20, loss = 0.0015
Iteration 40, loss = 0.0186
Iteration 60, loss = 0.0079
Iteration 80, loss = 0.0020
--- Epoch 1007 / 1369 - 2640 epochs total
Iteration 0, loss = 0.0036
Iteration 20, loss = 0.0013
Iteration 40, loss = 0.0061
Iteration 60, loss = 0.0038
Iteration 80, loss = 0.0099
--- Epoch 1008 / 1369 - 2641 epochs total
Iteration 0, loss = 0.0035
Iteration 20, loss = 0.0037
Iteration 40, loss = 0.0039
Iteration 60, loss = 0.0280
Iteration 80, loss = 0.0097
--- Epoch 1009 / 1369 - 2642 epochs total
Iteration 0, loss = 0.0113
Iteration 20, loss = 0.0032
Iteration 40, loss = 0.0059
Iteration 60, loss = 0.0038
Iteration 80, loss = 0.0082
--- Epoch 1010 / 1369 - 2643 epochs total
Iteration 0, loss = 0.0043
Iteration 20, loss = 0.0040
Iteration 40, loss = 0.0311
Iteration 60, loss = 0.0034
Iteration 80, loss = 0.0029
--- Epoch 1011 / 1369 - 2644 epochs total
Iteration 0, loss = 0.0068
Iteration 20, loss = 0.0014
Iteration 40, loss = 0.0071
Iteration 60, loss = 0.0152
Iteration 80, loss = 0.0030
--- Epoch 1012 / 1369 - 2645 epochs total
Iteration 0, loss = 0.0052
Iteration 20, loss = 0.0098
Iteration 40, loss = 0.0063
Iteration 60, loss = 0.0029
Iteration 80, loss = 0.0025
--- Epoch 1013 / 1369 - 2646 epochs total
Iteration 0, loss = 0.0049
Iteration 20, loss = 0.0028
Iteration 40, loss = 0.0047
Iteration 60, loss = 0.0066
Iteration 80, loss = 0.0022
--- Epoch 1014 / 1369 - 2647 epochs total
Iteration 0, loss = 0.0023
Iteration 20, loss = 0.0015
Iteration 40, loss = 0.0043
Iteration 60, loss = 0.0066
Iteration 80, loss = 0.0030
--- Epoch 1015 / 1369 - 2648 epochs total
Iteration 0, loss = 0.0066
Iteration 20, loss = 0.0014
Iteration 40, loss = 0.0249
Iteration 60, loss = 0.0029
Iteration 80, loss = 0.0037
--- Epoch 1016 / 1369 - 2649 epochs total
Iteration 0, loss = 0.0056
Iteration 20, loss = 0.0050
Iteration 40, loss = 0.0026
Iteration 60, loss = 0.0139
Iteration 80, loss = 0.0057
--- Epoch 1017 / 1369 - 2650 epochs total
Iteration 0, loss = 0.0158
Iteration 20, loss = 0.0007
Iteration 40, loss = 0.0013
Iteration 60, loss = 0.0281
Iteration 80, loss = 0.0023
--- Epoch 1018 / 1369 - 2651 epochs total
Iteration 0, loss = 0.0020
Iteration 20, loss = 0.0046
Iteration 40, loss = 0.0103
Iteration 60, loss = 0.0031
Iteration 80, loss = 0.0040
--- Epoch 1019 / 1369 - 2652 epochs total
Iteration 0, loss = 0.0041
Iteration 20, loss = 0.0021
Iteration 40, loss = 0.0042
Iteration 60, loss = 0.0060
Iteration 80, loss = 0.0021
--- Epoch 1020 / 1369 - 2653 epochs total
Iteration 0, loss = 0.0069
Iteration 20, loss = 0.0045
Iteration 40, loss = 0.0015
Iteration 60, loss = 0.0025
Iteration 80, loss = 0.0038
--- Epoch 1021 / 1369 - 2654 epochs total
Iteration 0, loss = 0.0025
Iteration 20, loss = 0.0136
Iteration 40, loss = 0.0074
Iteration 60, loss = 0.0029
Iteration 80, loss = 0.0042
--- Epoch 1022 / 1369 - 2655 epochs total
Iteration 0, loss = 0.0015
Iteration 20, loss = 0.0100
Iteration 40, loss = 0.0132
Iteration 60, loss = 0.0035
Iteration 80, loss = 0.0012
--- Epoch 1023 / 1369 - 2656 epochs total
Iteration 0, loss = 0.0055
Iteration 20, loss = 0.0035
Iteration 40, loss = 0.0012
Iteration 60, loss = 0.0033
Iteration 80, loss = 0.0032
--- Epoch 1024 / 1369 - 2657 epochs total
Iteration 0, loss = 0.0042
Iteration 20, loss = 0.0020
Iteration 40, loss = 0.0017
Iteration 60, loss = 0.0042
Iteration 80, loss = 0.0072
--- Epoch 1025 / 1369 - 2658 epochs total
Iteration 0, loss = 0.0009
Iteration 20, loss = 0.0162
Iteration 40, loss = 0.0019
Iteration 60, loss = 0.0068
Iteration 80, loss = 0.0235
--- Epoch 1026 / 1369 - 2659 epochs total
Iteration 0, loss = 0.0013
Iteration 20, loss = 0.0126
Iteration 40, loss = 0.0031
Iteration 60, loss = 0.0098
Iteration 80, loss = 0.0055
--- Epoch 1027 / 1369 - 2660 epochs total
Iteration 0, loss = 0.0039
Iteration 20, loss = 0.0034
Iteration 40, loss = 0.0036
Iteration 60, loss = 0.0019
Iteration 80, loss = 0.0060
--- Epoch 1028 / 1369 - 2661 epochs total
Iteration 0, loss = 0.0023
Iteration 20, loss = 0.0005
Iteration 40, loss = 0.0017
Iteration 60, loss = 0.0174
Iteration 80, loss = 0.0060
--- Epoch 1029 / 1369 - 2662 epochs total
Iteration 0, loss = 0.0025
Iteration 20, loss = 0.0041
Iteration 40, loss = 0.0044
Iteration 60, loss = 0.0027
Iteration 80, loss = 0.0024
--- Epoch 1030 / 1369 - 2663 epochs total
Iteration 0, loss = 0.0032
Iteration 20, loss = 0.0112
Iteration 40, loss = 0.0013
Iteration 60, loss = 0.0024
Iteration 80, loss = 0.0039
--- Epoch 1031 / 1369 - 2664 epochs total
Iteration 0, loss = 0.0062
Iteration 20, loss = 0.0240
Iteration 40, loss = 0.0027
Iteration 60, loss = 0.0020
Iteration 80, loss = 0.0132
--- Epoch 1032 / 1369 - 2665 epochs total
Iteration 0, loss = 0.0030
Iteration 20, loss = 0.0109
Iteration 40, loss = 0.0174
Iteration 60, loss = 0.0058
Iteration 80, loss = 0.0016
--- Epoch 1033 / 1369 - 2666 epochs total
Iteration 0, loss = 0.0035
Iteration 20, loss = 0.0125
Iteration 40, loss = 0.0061
Iteration 60, loss = 0.0046
Iteration 80, loss = 0.0018
--- Epoch 1034 / 1369 - 2667 epochs total
Iteration 0, loss = 0.0013
Iteration 20, loss = 0.0016
Iteration 40, loss = 0.0023
Iteration 60, loss = 0.0044
Iteration 80, loss = 0.0021
--- Epoch 1035 / 1369 - 2668 epochs total
Iteration 0, loss = 0.0026
Iteration 20, loss = 0.0014
Iteration 40, loss = 0.0145
Iteration 60, loss = 0.0034
Iteration 80, loss = 0.0057
--- Epoch 1036 / 1369 - 2669 epochs total
Iteration 0, loss = 0.0030
Iteration 20, loss = 0.0049
Iteration 40, loss = 0.0042
Iteration 60, loss = 0.0027
Iteration 80, loss = 0.0107
--- Epoch 1037 / 1369 - 2670 epochs total
Iteration 0, loss = 0.0018
Iteration 20, loss = 0.0137
Iteration 40, loss = 0.0032
Iteration 60, loss = 0.0011
Iteration 80, loss = 0.0037
--- Epoch 1038 / 1369 - 2671 epochs total
Iteration 0, loss = 0.0189
Iteration 20, loss = 0.0056
Iteration 40, loss = 0.0049
Iteration 60, loss = 0.0028
Iteration 80, loss = 0.0043
--- Epoch 1039 / 1369 - 2672 epochs total
Iteration 0, loss = 0.0024
Iteration 20, loss = 0.0013
Iteration 40, loss = 0.0203
Iteration 60, loss = 0.0126
Iteration 80, loss = 0.0007
--- Epoch 1040 / 1369 - 2673 epochs total
Iteration 0, loss = 0.0047
Iteration 20, loss = 0.0018
Iteration 40, loss = 0.0014
Iteration 60, loss = 0.0039
Iteration 80, loss = 0.0023
--- Epoch 1041 / 1369 - 2674 epochs total
Iteration 0, loss = 0.0048
Iteration 20, loss = 0.0089
Iteration 40, loss = 0.0037
Iteration 60, loss = 0.0088
Iteration 80, loss = 0.0028
--- Epoch 1042 / 1369 - 2675 epochs total
Iteration 0, loss = 0.0014
Iteration 20, loss = 0.0111
Iteration 40, loss = 0.0091
Iteration 60, loss = 0.0060
Iteration 80, loss = 0.0080
--- Epoch 1043 / 1369 - 2676 epochs total
Iteration 0, loss = 0.0075
Iteration 20, loss = 0.0041
Iteration 40, loss = 0.0015
Iteration 60, loss = 0.0018
Iteration 80, loss = 0.0096
--- Epoch 1044 / 1369 - 2677 epochs total
Iteration 0, loss = 0.0081
Iteration 20, loss = 0.0142
Iteration 40, loss = 0.0087
Iteration 60, loss = 0.0023
Iteration 80, loss = 0.0037
--- Epoch 1045 / 1369 - 2678 epochs total
Iteration 0, loss = 0.0028
Iteration 20, loss = 0.0039
Iteration 40, loss = 0.0021
Iteration 60, loss = 0.0032
Iteration 80, loss = 0.0025
--- Epoch 1046 / 1369 - 2679 epochs total
Iteration 0, loss = 0.0041
Iteration 20, loss = 0.0081
Iteration 40, loss = 0.0015
Iteration 60, loss = 0.0036
Iteration 80, loss = 0.0029
--- Epoch 1047 / 1369 - 2680 epochs total
Iteration 0, loss = 0.0007
Iteration 20, loss = 0.0035
Iteration 40, loss = 0.0039
Iteration 60, loss = 0.0014
Iteration 80, loss = 0.0037
--- Epoch 1048 / 1369 - 2681 epochs total
Iteration 0, loss = 0.0019
Iteration 20, loss = 0.0047
Iteration 40, loss = 0.0024
Iteration 60, loss = 0.0039
Iteration 80, loss = 0.0037
--- Epoch 1049 / 1369 - 2682 epochs total
Iteration 0, loss = 0.0059
Iteration 20, loss = 0.0036
Iteration 40, loss = 0.0011
Iteration 60, loss = 0.0028
Iteration 80, loss = 0.0019
--- Epoch 1050 / 1369 - 2683 epochs total
Iteration 0, loss = 0.0070
Iteration 20, loss = 0.0040
Iteration 40, loss = 0.0014
Iteration 60, loss = 0.0009
Iteration 80, loss = 0.0070
--- Epoch 1051 / 1369 - 2684 epochs total
Iteration 0, loss = 0.0178
Iteration 20, loss = 0.0065
Iteration 40, loss = 0.0089
Iteration 60, loss = 0.0172
Iteration 80, loss = 0.0015
--- Epoch 1052 / 1369 - 2685 epochs total
Iteration 0, loss = 0.0041
Iteration 20, loss = 0.0109
Iteration 40, loss = 0.0011
Iteration 60, loss = 0.0025
Iteration 80, loss = 0.0021
--- Epoch 1053 / 1369 - 2686 epochs total
Iteration 0, loss = 0.0058
Iteration 20, loss = 0.0013
Iteration 40, loss = 0.0212
Iteration 60, loss = 0.0127
Iteration 80, loss = 0.0021
--- Epoch 1054 / 1369 - 2687 epochs total
Iteration 0, loss = 0.0070
Iteration 20, loss = 0.0017
Iteration 40, loss = 0.0094
Iteration 60, loss = 0.0028
Iteration 80, loss = 0.0029
--- Epoch 1055 / 1369 - 2688 epochs total
Iteration 0, loss = 0.0037
Iteration 20, loss = 0.0034
Iteration 40, loss = 0.0025
Iteration 60, loss = 0.0053
Iteration 80, loss = 0.0017
--- Epoch 1056 / 1369 - 2689 epochs total
Iteration 0, loss = 0.0035
Iteration 20, loss = 0.0072
Iteration 40, loss = 0.0038
Iteration 60, loss = 0.0027
Iteration 80, loss = 0.0115
--- Epoch 1057 / 1369 - 2690 epochs total
Iteration 0, loss = 0.0284
Iteration 20, loss = 0.0009
Iteration 40, loss = 0.0030
Iteration 60, loss = 0.0012
Iteration 80, loss = 0.0085
--- Epoch 1058 / 1369 - 2691 epochs total
Iteration 0, loss = 0.0071
Iteration 20, loss = 0.0024
Iteration 40, loss = 0.0019
Iteration 60, loss = 0.0018
Iteration 80, loss = 0.0011
--- Epoch 1059 / 1369 - 2692 epochs total
Iteration 0, loss = 0.0068
Iteration 20, loss = 0.0013
Iteration 40, loss = 0.0020
Iteration 60, loss = 0.0081
Iteration 80, loss = 0.0026
--- Epoch 1060 / 1369 - 2693 epochs total
Iteration 0, loss = 0.0019
Iteration 20, loss = 0.0107
Iteration 40, loss = 0.0071
Iteration 60, loss = 0.0094
Iteration 80, loss = 0.0035
--- Epoch 1061 / 1369 - 2694 epochs total
Iteration 0, loss = 0.0100
Iteration 20, loss = 0.0012
Iteration 40, loss = 0.0097
Iteration 60, loss = 0.0035
Iteration 80, loss = 0.0029
--- Epoch 1062 / 1369 - 2695 epochs total
Iteration 0, loss = 0.0054
Iteration 20, loss = 0.0020
Iteration 40, loss = 0.0031
Iteration 60, loss = 0.0060
Iteration 80, loss = 0.0027
--- Epoch 1063 / 1369 - 2696 epochs total
Iteration 0, loss = 0.0047
Iteration 20, loss = 0.0029
Iteration 40, loss = 0.0024
Iteration 60, loss = 0.0180
Iteration 80, loss = 0.0102
--- Epoch 1064 / 1369 - 2697 epochs total
Iteration 0, loss = 0.0122
Iteration 20, loss = 0.0020
Iteration 40, loss = 0.0027
Iteration 60, loss = 0.0031
Iteration 80, loss = 0.0173
--- Epoch 1065 / 1369 - 2698 epochs total
Iteration 0, loss = 0.0057
Iteration 20, loss = 0.0181
Iteration 40, loss = 0.0284
Iteration 60, loss = 0.0042
Iteration 80, loss = 0.0098
--- Epoch 1066 / 1369 - 2699 epochs total
Iteration 0, loss = 0.0082
Iteration 20, loss = 0.0051
Iteration 40, loss = 0.0022
Iteration 60, loss = 0.0064
Iteration 80, loss = 0.0043
--- Epoch 1067 / 1369 - 2700 epochs total
Iteration 0, loss = 0.0030
Iteration 20, loss = 0.0119
Iteration 40, loss = 0.0138
Iteration 60, loss = 0.0032
Iteration 80, loss = 0.0028
--- Epoch 1068 / 1369 - 2701 epochs total
Iteration 0, loss = 0.0042
Iteration 20, loss = 0.0044
Iteration 40, loss = 0.0094
Iteration 60, loss = 0.0040
Iteration 80, loss = 0.0018
--- Epoch 1069 / 1369 - 2702 epochs total
Iteration 0, loss = 0.0020
Iteration 20, loss = 0.0020
Iteration 40, loss = 0.0038
Iteration 60, loss = 0.0055
Iteration 80, loss = 0.0079
--- Epoch 1070 / 1369 - 2703 epochs total
Iteration 0, loss = 0.0023
Iteration 20, loss = 0.0047
Iteration 40, loss = 0.0015
Iteration 60, loss = 0.0021
Iteration 80, loss = 0.0041
--- Epoch 1071 / 1369 - 2704 epochs total
Iteration 0, loss = 0.0033
Iteration 20, loss = 0.0086
Iteration 40, loss = 0.0021
Iteration 60, loss = 0.0088
Iteration 80, loss = 0.0019
--- Epoch 1072 / 1369 - 2705 epochs total
Iteration 0, loss = 0.0107
Iteration 20, loss = 0.0006
Iteration 40, loss = 0.0037
Iteration 60, loss = 0.0017
Iteration 80, loss = 0.0192
--- Epoch 1073 / 1369 - 2706 epochs total
Iteration 0, loss = 0.0036
Iteration 20, loss = 0.0125
Iteration 40, loss = 0.0104
Iteration 60, loss = 0.0057
Iteration 80, loss = 0.0138
--- Epoch 1074 / 1369 - 2707 epochs total
Iteration 0, loss = 0.0093
Iteration 20, loss = 0.0093
Iteration 40, loss = 0.0039
Iteration 60, loss = 0.0088
Iteration 80, loss = 0.0059
--- Epoch 1075 / 1369 - 2708 epochs total
Iteration 0, loss = 0.0058
Iteration 20, loss = 0.0023
Iteration 40, loss = 0.0024
Iteration 60, loss = 0.0050
Iteration 80, loss = 0.0100
--- Epoch 1076 / 1369 - 2709 epochs total
Iteration 0, loss = 0.0009
Iteration 20, loss = 0.0034
Iteration 40, loss = 0.0024
Iteration 60, loss = 0.0014
Iteration 80, loss = 0.0045
--- Epoch 1077 / 1369 - 2710 epochs total
Iteration 0, loss = 0.0045
Iteration 20, loss = 0.0013
Iteration 40, loss = 0.0119
Iteration 60, loss = 0.0052
Iteration 80, loss = 0.0024
--- Epoch 1078 / 1369 - 2711 epochs total
Iteration 0, loss = 0.0038
Iteration 20, loss = 0.0022
Iteration 40, loss = 0.0014
Iteration 60, loss = 0.0057
Iteration 80, loss = 0.0095
--- Epoch 1079 / 1369 - 2712 epochs total
Iteration 0, loss = 0.0038
Iteration 20, loss = 0.0072
Iteration 40, loss = 0.0018
Iteration 60, loss = 0.0026
Iteration 80, loss = 0.0027
--- Epoch 1080 / 1369 - 2713 epochs total
Iteration 0, loss = 0.0060
Iteration 20, loss = 0.0235
Iteration 40, loss = 0.0046
Iteration 60, loss = 0.0027
Iteration 80, loss = 0.0025
--- Epoch 1081 / 1369 - 2714 epochs total
Iteration 0, loss = 0.0095
Iteration 20, loss = 0.0020
Iteration 40, loss = 0.0013
Iteration 60, loss = 0.0046
Iteration 80, loss = 0.0046
--- Epoch 1082 / 1369 - 2715 epochs total
Iteration 0, loss = 0.0041
Iteration 20, loss = 0.0119
Iteration 40, loss = 0.0105
Iteration 60, loss = 0.0177
Iteration 80, loss = 0.0019
--- Epoch 1083 / 1369 - 2716 epochs total
Iteration 0, loss = 0.0098
Iteration 20, loss = 0.0009
Iteration 40, loss = 0.0022
Iteration 60, loss = 0.0018
Iteration 80, loss = 0.0045
--- Epoch 1084 / 1369 - 2717 epochs total
Iteration 0, loss = 0.0022
Iteration 20, loss = 0.0067
Iteration 40, loss = 0.0042
Iteration 60, loss = 0.0161
Iteration 80, loss = 0.0497
--- Epoch 1085 / 1369 - 2718 epochs total
Iteration 0, loss = 0.0021
Iteration 20, loss = 0.0042
Iteration 40, loss = 0.0037
Iteration 60, loss = 0.0052
Iteration 80, loss = 0.0016
--- Epoch 1086 / 1369 - 2719 epochs total
Iteration 0, loss = 0.0023
Iteration 20, loss = 0.0029
Iteration 40, loss = 0.0028
Iteration 60, loss = 0.0038
Iteration 80, loss = 0.0118
--- Epoch 1087 / 1369 - 2720 epochs total
Iteration 0, loss = 0.0088
Iteration 20, loss = 0.0078
Iteration 40, loss = 0.0062
Iteration 60, loss = 0.0047
Iteration 80, loss = 0.0017
--- Epoch 1088 / 1369 - 2721 epochs total
Iteration 0, loss = 0.0025
Iteration 20, loss = 0.0039
Iteration 40, loss = 0.0013
Iteration 60, loss = 0.0013
Iteration 80, loss = 0.0041
--- Epoch 1089 / 1369 - 2722 epochs total
Iteration 0, loss = 0.0024
Iteration 20, loss = 0.0044
Iteration 40, loss = 0.0036
Iteration 60, loss = 0.0030
Iteration 80, loss = 0.0028
--- Epoch 1090 / 1369 - 2723 epochs total
Iteration 0, loss = 0.0038
Iteration 20, loss = 0.0052
Iteration 40, loss = 0.0031
Iteration 60, loss = 0.0021
Iteration 80, loss = 0.0026
--- Epoch 1091 / 1369 - 2724 epochs total
Iteration 0, loss = 0.0091
Iteration 20, loss = 0.0130
Iteration 40, loss = 0.0026
Iteration 60, loss = 0.0050
Iteration 80, loss = 0.0130
--- Epoch 1092 / 1369 - 2725 epochs total
Iteration 0, loss = 0.0132
Iteration 20, loss = 0.0048
Iteration 40, loss = 0.0010
Iteration 60, loss = 0.0056
Iteration 80, loss = 0.0011
--- Epoch 1093 / 1369 - 2726 epochs total
Iteration 0, loss = 0.0023
Iteration 20, loss = 0.0013
Iteration 40, loss = 0.0018
Iteration 60, loss = 0.0055
Iteration 80, loss = 0.0083
--- Epoch 1094 / 1369 - 2727 epochs total
Iteration 0, loss = 0.0049
Iteration 20, loss = 0.0035
Iteration 40, loss = 0.0023
Iteration 60, loss = 0.0119
Iteration 80, loss = 0.0125
--- Epoch 1095 / 1369 - 2728 epochs total
Iteration 0, loss = 0.0058
Iteration 20, loss = 0.0028
Iteration 40, loss = 0.0021
Iteration 60, loss = 0.0112
Iteration 80, loss = 0.0114
--- Epoch 1096 / 1369 - 2729 epochs total
Iteration 0, loss = 0.0029
Iteration 20, loss = 0.0021
Iteration 40, loss = 0.0050
Iteration 60, loss = 0.0069
Iteration 80, loss = 0.0033
--- Epoch 1097 / 1369 - 2730 epochs total
Iteration 0, loss = 0.0118
Iteration 20, loss = 0.0029
Iteration 40, loss = 0.0031
Iteration 60, loss = 0.0045
Iteration 80, loss = 0.0053
--- Epoch 1098 / 1369 - 2731 epochs total
Iteration 0, loss = 0.0068
Iteration 20, loss = 0.0024
Iteration 40, loss = 0.0015
Iteration 60, loss = 0.0021
Iteration 80, loss = 0.0022
--- Epoch 1099 / 1369 - 2732 epochs total
Iteration 0, loss = 0.0019
Iteration 20, loss = 0.0017
Iteration 40, loss = 0.0030
Iteration 60, loss = 0.0068
Iteration 80, loss = 0.0116
--- Epoch 1100 / 1369 - 2733 epochs total
Iteration 0, loss = 0.0040
Iteration 20, loss = 0.0031
Iteration 40, loss = 0.0175
Iteration 60, loss = 0.0019
Iteration 80, loss = 0.0028
--- Epoch 1101 / 1369 - 2734 epochs total
Iteration 0, loss = 0.0017
Iteration 20, loss = 0.0066
Iteration 40, loss = 0.0043
Iteration 60, loss = 0.0012
Iteration 80, loss = 0.0025
--- Epoch 1102 / 1369 - 2735 epochs total
Iteration 0, loss = 0.0010
Iteration 20, loss = 0.0060
Iteration 40, loss = 0.0157
Iteration 60, loss = 0.0127
Iteration 80, loss = 0.0026
--- Epoch 1103 / 1369 - 2736 epochs total
Iteration 0, loss = 0.0031
Iteration 20, loss = 0.0015
Iteration 40, loss = 0.0098
Iteration 60, loss = 0.0079
Iteration 80, loss = 0.0013
--- Epoch 1104 / 1369 - 2737 epochs total
Iteration 0, loss = 0.0022
Iteration 20, loss = 0.0016
Iteration 40, loss = 0.0168
Iteration 60, loss = 0.0029
Iteration 80, loss = 0.0016
--- Epoch 1105 / 1369 - 2738 epochs total
Iteration 0, loss = 0.0031
Iteration 20, loss = 0.0035
Iteration 40, loss = 0.0175
Iteration 60, loss = 0.0062
Iteration 80, loss = 0.0148
--- Epoch 1106 / 1369 - 2739 epochs total
Iteration 0, loss = 0.0036
Iteration 20, loss = 0.0032
Iteration 40, loss = 0.0033
Iteration 60, loss = 0.0378
Iteration 80, loss = 0.0023
--- Epoch 1107 / 1369 - 2740 epochs total
Iteration 0, loss = 0.0119
Iteration 20, loss = 0.0044
Iteration 40, loss = 0.0021
Iteration 60, loss = 0.0042
Iteration 80, loss = 0.0038
--- Epoch 1108 / 1369 - 2741 epochs total
Iteration 0, loss = 0.0021
Iteration 20, loss = 0.0018
Iteration 40, loss = 0.0020
Iteration 60, loss = 0.0095
Iteration 80, loss = 0.0039
--- Epoch 1109 / 1369 - 2742 epochs total
Iteration 0, loss = 0.0011
Iteration 20, loss = 0.0017
Iteration 40, loss = 0.0091
Iteration 60, loss = 0.0143
Iteration 80, loss = 0.0007
--- Epoch 1110 / 1369 - 2743 epochs total
Iteration 0, loss = 0.0014
Iteration 20, loss = 0.0121
Iteration 40, loss = 0.0015
Iteration 60, loss = 0.0043
Iteration 80, loss = 0.0005
--- Epoch 1111 / 1369 - 2744 epochs total
Iteration 0, loss = 0.0037
Iteration 20, loss = 0.0030
Iteration 40, loss = 0.0107
Iteration 60, loss = 0.0019
Iteration 80, loss = 0.0010
--- Epoch 1112 / 1369 - 2745 epochs total
Iteration 0, loss = 0.0107
Iteration 20, loss = 0.0172
Iteration 40, loss = 0.0051
Iteration 60, loss = 0.0018
Iteration 80, loss = 0.0159
--- Epoch 1113 / 1369 - 2746 epochs total
Iteration 0, loss = 0.0011
Iteration 20, loss = 0.0035
Iteration 40, loss = 0.0066
Iteration 60, loss = 0.0054
Iteration 80, loss = 0.0018
--- Epoch 1114 / 1369 - 2747 epochs total
Iteration 0, loss = 0.0033
Iteration 20, loss = 0.0020
Iteration 40, loss = 0.0085
Iteration 60, loss = 0.0011
Iteration 80, loss = 0.0088
--- Epoch 1115 / 1369 - 2748 epochs total
Iteration 0, loss = 0.0064
Iteration 20, loss = 0.0012
Iteration 40, loss = 0.0027
Iteration 60, loss = 0.0047
Iteration 80, loss = 0.0032
--- Epoch 1116 / 1369 - 2749 epochs total
Iteration 0, loss = 0.0017
Iteration 20, loss = 0.0035
Iteration 40, loss = 0.0017
Iteration 60, loss = 0.0082
Iteration 80, loss = 0.0098
--- Epoch 1117 / 1369 - 2750 epochs total
Iteration 0, loss = 0.0123
Iteration 20, loss = 0.0019
Iteration 40, loss = 0.0071
Iteration 60, loss = 0.0091
Iteration 80, loss = 0.0008
--- Epoch 1118 / 1369 - 2751 epochs total
Iteration 0, loss = 0.0044
Iteration 20, loss = 0.0012
Iteration 40, loss = 0.0070
Iteration 60, loss = 0.0023
Iteration 80, loss = 0.0023
--- Epoch 1119 / 1369 - 2752 epochs total
Iteration 0, loss = 0.0064
Iteration 20, loss = 0.0028
Iteration 40, loss = 0.0048
Iteration 60, loss = 0.0029
Iteration 80, loss = 0.0094
--- Epoch 1120 / 1369 - 2753 epochs total
Iteration 0, loss = 0.0043
Iteration 20, loss = 0.0118
Iteration 40, loss = 0.0015
Iteration 60, loss = 0.0282
Iteration 80, loss = 0.0012
--- Epoch 1121 / 1369 - 2754 epochs total
Iteration 0, loss = 0.0031
Iteration 20, loss = 0.0011
Iteration 40, loss = 0.0104
Iteration 60, loss = 0.0051
Iteration 80, loss = 0.0103
--- Epoch 1122 / 1369 - 2755 epochs total
Iteration 0, loss = 0.0033
Iteration 20, loss = 0.0017
Iteration 40, loss = 0.0044
Iteration 60, loss = 0.0021
Iteration 80, loss = 0.0023
--- Epoch 1123 / 1369 - 2756 epochs total
Iteration 0, loss = 0.0031
Iteration 20, loss = 0.0020
Iteration 40, loss = 0.0043
Iteration 60, loss = 0.0072
Iteration 80, loss = 0.0040
--- Epoch 1124 / 1369 - 2757 epochs total
Iteration 0, loss = 0.0032
Iteration 20, loss = 0.0033
Iteration 40, loss = 0.0085
Iteration 60, loss = 0.0043
Iteration 80, loss = 0.0039
--- Epoch 1125 / 1369 - 2758 epochs total
Iteration 0, loss = 0.0055
Iteration 20, loss = 0.0020
Iteration 40, loss = 0.0126
Iteration 60, loss = 0.0049
Iteration 80, loss = 0.0035
--- Epoch 1126 / 1369 - 2759 epochs total
Iteration 0, loss = 0.0026
Iteration 20, loss = 0.0025
Iteration 40, loss = 0.0042
Iteration 60, loss = 0.0048
Iteration 80, loss = 0.0044
--- Epoch 1127 / 1369 - 2760 epochs total
Iteration 0, loss = 0.0192
Iteration 20, loss = 0.0012
Iteration 40, loss = 0.0019
Iteration 60, loss = 0.0023
Iteration 80, loss = 0.0051
--- Epoch 1128 / 1369 - 2761 epochs total
Iteration 0, loss = 0.0019
Iteration 20, loss = 0.0014
Iteration 40, loss = 0.0017
Iteration 60, loss = 0.0029
Iteration 80, loss = 0.0070
--- Epoch 1129 / 1369 - 2762 epochs total
Iteration 0, loss = 0.0052
Iteration 20, loss = 0.0012
Iteration 40, loss = 0.0028
Iteration 60, loss = 0.0170
Iteration 80, loss = 0.0091
--- Epoch 1130 / 1369 - 2763 epochs total
Iteration 0, loss = 0.0068
Iteration 20, loss = 0.0034
Iteration 40, loss = 0.0029
Iteration 60, loss = 0.0067
Iteration 80, loss = 0.0079
--- Epoch 1131 / 1369 - 2764 epochs total
Iteration 0, loss = 0.0098
Iteration 20, loss = 0.0035
Iteration 40, loss = 0.0027
Iteration 60, loss = 0.0015
Iteration 80, loss = 0.0045
--- Epoch 1132 / 1369 - 2765 epochs total
Iteration 0, loss = 0.0020
Iteration 20, loss = 0.0052
Iteration 40, loss = 0.0031
Iteration 60, loss = 0.0087
Iteration 80, loss = 0.0068
--- Epoch 1133 / 1369 - 2766 epochs total
Iteration 0, loss = 0.0027
Iteration 20, loss = 0.0060
Iteration 40, loss = 0.0090
Iteration 60, loss = 0.0064
Iteration 80, loss = 0.0186
--- Epoch 1134 / 1369 - 2767 epochs total
Iteration 0, loss = 0.0016
Iteration 20, loss = 0.0034
Iteration 40, loss = 0.0054
Iteration 60, loss = 0.0020
Iteration 80, loss = 0.0052
--- Epoch 1135 / 1369 - 2768 epochs total
Iteration 0, loss = 0.0035
Iteration 20, loss = 0.0039
Iteration 40, loss = 0.0039
Iteration 60, loss = 0.0033
Iteration 80, loss = 0.0019
--- Epoch 1136 / 1369 - 2769 epochs total
Iteration 0, loss = 0.0021
Iteration 20, loss = 0.0017
Iteration 40, loss = 0.0051
Iteration 60, loss = 0.0012
Iteration 80, loss = 0.0168
--- Epoch 1137 / 1369 - 2770 epochs total
Iteration 0, loss = 0.0041
Iteration 20, loss = 0.0181
Iteration 40, loss = 0.0041
Iteration 60, loss = 0.0079
Iteration 80, loss = 0.0135
--- Epoch 1138 / 1369 - 2771 epochs total
Iteration 0, loss = 0.0022
Iteration 20, loss = 0.0114
Iteration 40, loss = 0.0010
Iteration 60, loss = 0.0123
Iteration 80, loss = 0.0031
--- Epoch 1139 / 1369 - 2772 epochs total
Iteration 0, loss = 0.0022
Iteration 20, loss = 0.0037
Iteration 40, loss = 0.0045
Iteration 60, loss = 0.0025
Iteration 80, loss = 0.0016
--- Epoch 1140 / 1369 - 2773 epochs total
Iteration 0, loss = 0.0038
Iteration 20, loss = 0.0020
Iteration 40, loss = 0.0026
Iteration 60, loss = 0.0014
Iteration 80, loss = 0.0029
--- Epoch 1141 / 1369 - 2774 epochs total
Iteration 0, loss = 0.0075
Iteration 20, loss = 0.0020
Iteration 40, loss = 0.0095
Iteration 60, loss = 0.0085
Iteration 80, loss = 0.0023
--- Epoch 1142 / 1369 - 2775 epochs total
Iteration 0, loss = 0.0040
Iteration 20, loss = 0.0045
Iteration 40, loss = 0.0007
Iteration 60, loss = 0.0024
Iteration 80, loss = 0.0049
--- Epoch 1143 / 1369 - 2776 epochs total
Iteration 0, loss = 0.0026
Iteration 20, loss = 0.0032
Iteration 40, loss = 0.0030
Iteration 60, loss = 0.0040
Iteration 80, loss = 0.0006
--- Epoch 1144 / 1369 - 2777 epochs total
Iteration 0, loss = 0.0112
Iteration 20, loss = 0.0027
Iteration 40, loss = 0.0009
Iteration 60, loss = 0.0031
Iteration 80, loss = 0.0113
--- Epoch 1145 / 1369 - 2778 epochs total
Iteration 0, loss = 0.0012
Iteration 20, loss = 0.0012
Iteration 40, loss = 0.0081
Iteration 60, loss = 0.0032
Iteration 80, loss = 0.0071
--- Epoch 1146 / 1369 - 2779 epochs total
Iteration 0, loss = 0.0019
Iteration 20, loss = 0.0073
Iteration 40, loss = 0.0037
Iteration 60, loss = 0.0007
Iteration 80, loss = 0.0050
--- Epoch 1147 / 1369 - 2780 epochs total
Iteration 0, loss = 0.0071
Iteration 20, loss = 0.0031
Iteration 40, loss = 0.0049
Iteration 60, loss = 0.0076
Iteration 80, loss = 0.0042
--- Epoch 1148 / 1369 - 2781 epochs total
Iteration 0, loss = 0.0036
Iteration 20, loss = 0.0033
Iteration 40, loss = 0.0056
Iteration 60, loss = 0.0014
Iteration 80, loss = 0.0131
--- Epoch 1149 / 1369 - 2782 epochs total
Iteration 0, loss = 0.0030
Iteration 20, loss = 0.0112
Iteration 40, loss = 0.0012
Iteration 60, loss = 0.0021
Iteration 80, loss = 0.0018
--- Epoch 1150 / 1369 - 2783 epochs total
Iteration 0, loss = 0.0157
Iteration 20, loss = 0.0021
Iteration 40, loss = 0.0156
Iteration 60, loss = 0.0061
Iteration 80, loss = 0.0032
--- Epoch 1151 / 1369 - 2784 epochs total
Iteration 0, loss = 0.0218
Iteration 20, loss = 0.0043
Iteration 40, loss = 0.0100
Iteration 60, loss = 0.0023
Iteration 80, loss = 0.0063
--- Epoch 1152 / 1369 - 2785 epochs total
Iteration 0, loss = 0.0027
Iteration 20, loss = 0.0027
Iteration 40, loss = 0.0060
Iteration 60, loss = 0.0020
Iteration 80, loss = 0.0149
--- Epoch 1153 / 1369 - 2786 epochs total
Iteration 0, loss = 0.0068
Iteration 20, loss = 0.0072
Iteration 40, loss = 0.0036
Iteration 60, loss = 0.0025
Iteration 80, loss = 0.0028
--- Epoch 1154 / 1369 - 2787 epochs total
Iteration 0, loss = 0.0103
Iteration 20, loss = 0.0015
Iteration 40, loss = 0.0023
Iteration 60, loss = 0.0095
Iteration 80, loss = 0.0104
--- Epoch 1155 / 1369 - 2788 epochs total
Iteration 0, loss = 0.0041
Iteration 20, loss = 0.0057
Iteration 40, loss = 0.0025
Iteration 60, loss = 0.0035
Iteration 80, loss = 0.0029
--- Epoch 1156 / 1369 - 2789 epochs total
Iteration 0, loss = 0.0009
Iteration 20, loss = 0.0035
Iteration 40, loss = 0.0039
Iteration 60, loss = 0.0118
Iteration 80, loss = 0.0042
--- Epoch 1157 / 1369 - 2790 epochs total
Iteration 0, loss = 0.0033
Iteration 20, loss = 0.0089
Iteration 40, loss = 0.0045
Iteration 60, loss = 0.0051
Iteration 80, loss = 0.0051
--- Epoch 1158 / 1369 - 2791 epochs total
Iteration 0, loss = 0.0052
Iteration 20, loss = 0.0010
Iteration 40, loss = 0.0112
Iteration 60, loss = 0.0016
Iteration 80, loss = 0.0041
--- Epoch 1159 / 1369 - 2792 epochs total
Iteration 0, loss = 0.0028
Iteration 20, loss = 0.0056
Iteration 40, loss = 0.0032
Iteration 60, loss = 0.0112
Iteration 80, loss = 0.0023
--- Epoch 1160 / 1369 - 2793 epochs total
Iteration 0, loss = 0.0057
Iteration 20, loss = 0.0041
Iteration 40, loss = 0.0034
Iteration 60, loss = 0.0081
Iteration 80, loss = 0.0025
--- Epoch 1161 / 1369 - 2794 epochs total
Iteration 0, loss = 0.0292
Iteration 20, loss = 0.0024
Iteration 40, loss = 0.0085
Iteration 60, loss = 0.0043
Iteration 80, loss = 0.0015
--- Epoch 1162 / 1369 - 2795 epochs total
Iteration 0, loss = 0.0015
Iteration 20, loss = 0.0035
Iteration 40, loss = 0.0107
Iteration 60, loss = 0.0049
Iteration 80, loss = 0.0067
--- Epoch 1163 / 1369 - 2796 epochs total
Iteration 0, loss = 0.0061
Iteration 20, loss = 0.0038
Iteration 40, loss = 0.0018
Iteration 60, loss = 0.0093
Iteration 80, loss = 0.0202
--- Epoch 1164 / 1369 - 2797 epochs total
Iteration 0, loss = 0.0032
Iteration 20, loss = 0.0020
Iteration 40, loss = 0.0028
Iteration 60, loss = 0.0053
Iteration 80, loss = 0.0093
--- Epoch 1165 / 1369 - 2798 epochs total
Iteration 0, loss = 0.0035
Iteration 20, loss = 0.0057
Iteration 40, loss = 0.0021
Iteration 60, loss = 0.0037
Iteration 80, loss = 0.0028
--- Epoch 1166 / 1369 - 2799 epochs total
Iteration 0, loss = 0.0043
Iteration 20, loss = 0.0021
Iteration 40, loss = 0.0088
Iteration 60, loss = 0.0142
Iteration 80, loss = 0.0023
--- Epoch 1167 / 1369 - 2800 epochs total
Iteration 0, loss = 0.0045
Iteration 20, loss = 0.0033
Iteration 40, loss = 0.0045
Iteration 60, loss = 0.0028
Iteration 80, loss = 0.0012
--- Epoch 1168 / 1369 - 2801 epochs total
Iteration 0, loss = 0.0203
Iteration 20, loss = 0.0055
Iteration 40, loss = 0.0055
Iteration 60, loss = 0.0043
Iteration 80, loss = 0.0012
--- Epoch 1169 / 1369 - 2802 epochs total
Iteration 0, loss = 0.0021
Iteration 20, loss = 0.0031
Iteration 40, loss = 0.0085
Iteration 60, loss = 0.0098
Iteration 80, loss = 0.0103
--- Epoch 1170 / 1369 - 2803 epochs total
Iteration 0, loss = 0.0086
Iteration 20, loss = 0.0049
Iteration 40, loss = 0.0013
Iteration 60, loss = 0.0027
Iteration 80, loss = 0.0034
--- Epoch 1171 / 1369 - 2804 epochs total
Iteration 0, loss = 0.0031
Iteration 20, loss = 0.0053
Iteration 40, loss = 0.0184
Iteration 60, loss = 0.0031
Iteration 80, loss = 0.0018
--- Epoch 1172 / 1369 - 2805 epochs total
Iteration 0, loss = 0.0023
Iteration 20, loss = 0.0020
Iteration 40, loss = 0.0038
Iteration 60, loss = 0.0018
Iteration 80, loss = 0.0030
--- Epoch 1173 / 1369 - 2806 epochs total
Iteration 0, loss = 0.0021
Iteration 20, loss = 0.0012
Iteration 40, loss = 0.0035
Iteration 60, loss = 0.0042
Iteration 80, loss = 0.0014
--- Epoch 1174 / 1369 - 2807 epochs total
Iteration 0, loss = 0.0037
Iteration 20, loss = 0.0190
Iteration 40, loss = 0.0185
Iteration 60, loss = 0.0024
Iteration 80, loss = 0.0058
--- Epoch 1175 / 1369 - 2808 epochs total
Iteration 0, loss = 0.0080
Iteration 20, loss = 0.0048
Iteration 40, loss = 0.0057
Iteration 60, loss = 0.0021
Iteration 80, loss = 0.0082
--- Epoch 1176 / 1369 - 2809 epochs total
Iteration 0, loss = 0.0029
Iteration 20, loss = 0.0095
Iteration 40, loss = 0.0009
Iteration 60, loss = 0.0029
Iteration 80, loss = 0.0027
--- Epoch 1177 / 1369 - 2810 epochs total
Iteration 0, loss = 0.0029
Iteration 20, loss = 0.0041
Iteration 40, loss = 0.0190
Iteration 60, loss = 0.0015
Iteration 80, loss = 0.0025
--- Epoch 1178 / 1369 - 2811 epochs total
Iteration 0, loss = 0.0103
Iteration 20, loss = 0.0068
Iteration 40, loss = 0.0046
Iteration 60, loss = 0.0044
Iteration 80, loss = 0.0043
--- Epoch 1179 / 1369 - 2812 epochs total
Iteration 0, loss = 0.0021
Iteration 20, loss = 0.0023
Iteration 40, loss = 0.0067
Iteration 60, loss = 0.0124
Iteration 80, loss = 0.0012
--- Epoch 1180 / 1369 - 2813 epochs total
Iteration 0, loss = 0.0024
Iteration 20, loss = 0.0025
Iteration 40, loss = 0.0023
Iteration 60, loss = 0.0050
Iteration 80, loss = 0.0107
--- Epoch 1181 / 1369 - 2814 epochs total
Iteration 0, loss = 0.0029
Iteration 20, loss = 0.0053
Iteration 40, loss = 0.0091
Iteration 60, loss = 0.0022
Iteration 80, loss = 0.0023
--- Epoch 1182 / 1369 - 2815 epochs total
Iteration 0, loss = 0.0014
Iteration 20, loss = 0.0037
Iteration 40, loss = 0.0045
Iteration 60, loss = 0.0080
Iteration 80, loss = 0.0128
--- Epoch 1183 / 1369 - 2816 epochs total
Iteration 0, loss = 0.0025
Iteration 20, loss = 0.0031
Iteration 40, loss = 0.0010
Iteration 60, loss = 0.0053
Iteration 80, loss = 0.0156
--- Epoch 1184 / 1369 - 2817 epochs total
Iteration 0, loss = 0.0057
Iteration 20, loss = 0.0035
Iteration 40, loss = 0.0114
Iteration 60, loss = 0.0036
Iteration 80, loss = 0.0015
--- Epoch 1185 / 1369 - 2818 epochs total
Iteration 0, loss = 0.0044
Iteration 20, loss = 0.0070
Iteration 40, loss = 0.0008
Iteration 60, loss = 0.0046
Iteration 80, loss = 0.0035
--- Epoch 1186 / 1369 - 2819 epochs total
Iteration 0, loss = 0.0022
Iteration 20, loss = 0.0019
Iteration 40, loss = 0.0129
Iteration 60, loss = 0.0044
Iteration 80, loss = 0.0037
--- Epoch 1187 / 1369 - 2820 epochs total
Iteration 0, loss = 0.0036
Iteration 20, loss = 0.0089
Iteration 40, loss = 0.0026
Iteration 60, loss = 0.0034
Iteration 80, loss = 0.0039
--- Epoch 1188 / 1369 - 2821 epochs total
Iteration 0, loss = 0.0031
Iteration 20, loss = 0.0058
Iteration 40, loss = 0.0047
Iteration 60, loss = 0.0051
Iteration 80, loss = 0.0099
--- Epoch 1189 / 1369 - 2822 epochs total
Iteration 0, loss = 0.0026
Iteration 20, loss = 0.0025
Iteration 40, loss = 0.0164
Iteration 60, loss = 0.0028
Iteration 80, loss = 0.0032
--- Epoch 1190 / 1369 - 2823 epochs total
Iteration 0, loss = 0.0024
Iteration 20, loss = 0.0031
Iteration 40, loss = 0.0075
Iteration 60, loss = 0.0076
Iteration 80, loss = 0.0015
--- Epoch 1191 / 1369 - 2824 epochs total
Iteration 0, loss = 0.0032
Iteration 20, loss = 0.0044
Iteration 40, loss = 0.0013
Iteration 60, loss = 0.0069
Iteration 80, loss = 0.0085
--- Epoch 1192 / 1369 - 2825 epochs total
Iteration 0, loss = 0.0137
Iteration 20, loss = 0.0053
Iteration 40, loss = 0.0018
Iteration 60, loss = 0.0099
Iteration 80, loss = 0.0008
--- Epoch 1193 / 1369 - 2826 epochs total
Iteration 0, loss = 0.0033
Iteration 20, loss = 0.0015
Iteration 40, loss = 0.0116
Iteration 60, loss = 0.0020
Iteration 80, loss = 0.0014
--- Epoch 1194 / 1369 - 2827 epochs total
Iteration 0, loss = 0.0025
Iteration 20, loss = 0.0017
Iteration 40, loss = 0.0034
Iteration 60, loss = 0.0068
Iteration 80, loss = 0.0056
--- Epoch 1195 / 1369 - 2828 epochs total
Iteration 0, loss = 0.0170
Iteration 20, loss = 0.0055
Iteration 40, loss = 0.0031
Iteration 60, loss = 0.0031
Iteration 80, loss = 0.0051
--- Epoch 1196 / 1369 - 2829 epochs total
Iteration 0, loss = 0.0025
Iteration 20, loss = 0.0074
Iteration 40, loss = 0.0012
Iteration 60, loss = 0.0020
Iteration 80, loss = 0.0172
--- Epoch 1197 / 1369 - 2830 epochs total
Iteration 0, loss = 0.0014
Iteration 20, loss = 0.0030
Iteration 40, loss = 0.0184
Iteration 60, loss = 0.0041
Iteration 80, loss = 0.0028
--- Epoch 1198 / 1369 - 2831 epochs total
Iteration 0, loss = 0.0058
Iteration 20, loss = 0.0009
Iteration 40, loss = 0.0029
Iteration 60, loss = 0.0072
Iteration 80, loss = 0.0029
--- Epoch 1199 / 1369 - 2832 epochs total
Iteration 0, loss = 0.0043
Iteration 20, loss = 0.0029
Iteration 40, loss = 0.0020
Iteration 60, loss = 0.0055
Iteration 80, loss = 0.0038
--- Epoch 1200 / 1369 - 2833 epochs total
Iteration 0, loss = 0.0018
Iteration 20, loss = 0.0033
Iteration 40, loss = 0.0036
Iteration 60, loss = 0.0016
Iteration 80, loss = 0.0057
--- Epoch 1201 / 1369 - 2834 epochs total
Iteration 0, loss = 0.0056
Iteration 20, loss = 0.0017
Iteration 40, loss = 0.0021
Iteration 60, loss = 0.0013
Iteration 80, loss = 0.0065
--- Epoch 1202 / 1369 - 2835 epochs total
Iteration 0, loss = 0.0077
Iteration 20, loss = 0.0071
Iteration 40, loss = 0.0018
Iteration 60, loss = 0.0022
Iteration 80, loss = 0.0019
--- Epoch 1203 / 1369 - 2836 epochs total
Iteration 0, loss = 0.0027
Iteration 20, loss = 0.0117
Iteration 40, loss = 0.0047
Iteration 60, loss = 0.0033
Iteration 80, loss = 0.0020
--- Epoch 1204 / 1369 - 2837 epochs total
Iteration 0, loss = 0.0032
Iteration 20, loss = 0.0078
Iteration 40, loss = 0.0145
Iteration 60, loss = 0.0061
Iteration 80, loss = 0.0153
--- Epoch 1205 / 1369 - 2838 epochs total
Iteration 0, loss = 0.0017
Iteration 20, loss = 0.0021
Iteration 40, loss = 0.0032
Iteration 60, loss = 0.0019
Iteration 80, loss = 0.0019
--- Epoch 1206 / 1369 - 2839 epochs total
Iteration 0, loss = 0.0090
Iteration 20, loss = 0.0042
Iteration 40, loss = 0.0040
Iteration 60, loss = 0.0024
Iteration 80, loss = 0.0061
--- Epoch 1207 / 1369 - 2840 epochs total
Iteration 0, loss = 0.0054
Iteration 20, loss = 0.0016
Iteration 40, loss = 0.0311
Iteration 60, loss = 0.0064
Iteration 80, loss = 0.0025
--- Epoch 1208 / 1369 - 2841 epochs total
Iteration 0, loss = 0.0030
Iteration 20, loss = 0.0091
Iteration 40, loss = 0.0035
Iteration 60, loss = 0.0007
Iteration 80, loss = 0.0036
--- Epoch 1209 / 1369 - 2842 epochs total
Iteration 0, loss = 0.0023
Iteration 20, loss = 0.0098
Iteration 40, loss = 0.0052
Iteration 60, loss = 0.0045
Iteration 80, loss = 0.0063
--- Epoch 1210 / 1369 - 2843 epochs total
Iteration 0, loss = 0.0055
Iteration 20, loss = 0.0093
Iteration 40, loss = 0.0124
Iteration 60, loss = 0.0020
Iteration 80, loss = 0.0050
--- Epoch 1211 / 1369 - 2844 epochs total
Iteration 0, loss = 0.0294
Iteration 20, loss = 0.0041
Iteration 40, loss = 0.0039
Iteration 60, loss = 0.0090
Iteration 80, loss = 0.0039
--- Epoch 1212 / 1369 - 2845 epochs total
Iteration 0, loss = 0.0018
Iteration 20, loss = 0.0059
Iteration 40, loss = 0.0016
Iteration 60, loss = 0.0043
Iteration 80, loss = 0.0069
--- Epoch 1213 / 1369 - 2846 epochs total
Iteration 0, loss = 0.0033
Iteration 20, loss = 0.0005
Iteration 40, loss = 0.0162
Iteration 60, loss = 0.0063
Iteration 80, loss = 0.0030
--- Epoch 1214 / 1369 - 2847 epochs total
Iteration 0, loss = 0.0028
Iteration 20, loss = 0.0018
Iteration 40, loss = 0.0018
Iteration 60, loss = 0.0041
Iteration 80, loss = 0.0021
--- Epoch 1215 / 1369 - 2848 epochs total
Iteration 0, loss = 0.0028
Iteration 20, loss = 0.0012
Iteration 40, loss = 0.0026
Iteration 60, loss = 0.0049
Iteration 80, loss = 0.0227
--- Epoch 1216 / 1369 - 2849 epochs total
Iteration 0, loss = 0.0077
Iteration 20, loss = 0.0054
Iteration 40, loss = 0.0019
Iteration 60, loss = 0.0016
Iteration 80, loss = 0.0319
--- Epoch 1217 / 1369 - 2850 epochs total
Iteration 0, loss = 0.0132
Iteration 20, loss = 0.0021
Iteration 40, loss = 0.0068
Iteration 60, loss = 0.0037
Iteration 80, loss = 0.0058
--- Epoch 1218 / 1369 - 2851 epochs total
Iteration 0, loss = 0.0038
Iteration 20, loss = 0.0036
Iteration 40, loss = 0.0023
Iteration 60, loss = 0.0052
Iteration 80, loss = 0.0064
--- Epoch 1219 / 1369 - 2852 epochs total
Iteration 0, loss = 0.0063
Iteration 20, loss = 0.0192
Iteration 40, loss = 0.0028
Iteration 60, loss = 0.0025
Iteration 80, loss = 0.0018
--- Epoch 1220 / 1369 - 2853 epochs total
Iteration 0, loss = 0.0043
Iteration 20, loss = 0.0038
Iteration 40, loss = 0.0107
Iteration 60, loss = 0.0036
Iteration 80, loss = 0.0022
--- Epoch 1221 / 1369 - 2854 epochs total
Iteration 0, loss = 0.0044
Iteration 20, loss = 0.0023
Iteration 40, loss = 0.0042
Iteration 60, loss = 0.0039
Iteration 80, loss = 0.0023
--- Epoch 1222 / 1369 - 2855 epochs total
Iteration 0, loss = 0.0031
Iteration 20, loss = 0.0070
Iteration 40, loss = 0.0037
Iteration 60, loss = 0.0054
Iteration 80, loss = 0.0096
--- Epoch 1223 / 1369 - 2856 epochs total
Iteration 0, loss = 0.0043
Iteration 20, loss = 0.0114
Iteration 40, loss = 0.0192
Iteration 60, loss = 0.0023
Iteration 80, loss = 0.0018
--- Epoch 1224 / 1369 - 2857 epochs total
Iteration 0, loss = 0.0042
Iteration 20, loss = 0.0121
Iteration 40, loss = 0.0005
Iteration 60, loss = 0.0023
Iteration 80, loss = 0.0031
--- Epoch 1225 / 1369 - 2858 epochs total
Iteration 0, loss = 0.0035
Iteration 20, loss = 0.0046
Iteration 40, loss = 0.0027
Iteration 60, loss = 0.0014
Iteration 80, loss = 0.0081
--- Epoch 1226 / 1369 - 2859 epochs total
Iteration 0, loss = 0.0026
Iteration 20, loss = 0.0076
Iteration 40, loss = 0.0019
Iteration 60, loss = 0.0077
Iteration 80, loss = 0.0039
--- Epoch 1227 / 1369 - 2860 epochs total
Iteration 0, loss = 0.0047
Iteration 20, loss = 0.0006
Iteration 40, loss = 0.0130
Iteration 60, loss = 0.0019
Iteration 80, loss = 0.0076
--- Epoch 1228 / 1369 - 2861 epochs total
Iteration 0, loss = 0.0084
Iteration 20, loss = 0.0027
Iteration 40, loss = 0.0016
Iteration 60, loss = 0.0067
Iteration 80, loss = 0.0020
--- Epoch 1229 / 1369 - 2862 epochs total
Iteration 0, loss = 0.0041
Iteration 20, loss = 0.0037
Iteration 40, loss = 0.0025
Iteration 60, loss = 0.0119
Iteration 80, loss = 0.0054
--- Epoch 1230 / 1369 - 2863 epochs total
Iteration 0, loss = 0.0048
Iteration 20, loss = 0.0033
Iteration 40, loss = 0.0037
Iteration 60, loss = 0.0091
Iteration 80, loss = 0.0069
--- Epoch 1231 / 1369 - 2864 epochs total
Iteration 0, loss = 0.0120
Iteration 20, loss = 0.0020
Iteration 40, loss = 0.0033
Iteration 60, loss = 0.0008
Iteration 80, loss = 0.0020
--- Epoch 1232 / 1369 - 2865 epochs total
Iteration 0, loss = 0.0084
Iteration 20, loss = 0.0138
Iteration 40, loss = 0.0022
Iteration 60, loss = 0.0020
Iteration 80, loss = 0.0055
--- Epoch 1233 / 1369 - 2866 epochs total
Iteration 0, loss = 0.0071
Iteration 20, loss = 0.0029
Iteration 40, loss = 0.0020
Iteration 60, loss = 0.0064
Iteration 80, loss = 0.0025
--- Epoch 1234 / 1369 - 2867 epochs total
Iteration 0, loss = 0.0011
Iteration 20, loss = 0.0058
Iteration 40, loss = 0.0100
Iteration 60, loss = 0.0007
Iteration 80, loss = 0.0041
--- Epoch 1235 / 1369 - 2868 epochs total
Iteration 0, loss = 0.0049
Iteration 20, loss = 0.0044
Iteration 40, loss = 0.0025
Iteration 60, loss = 0.0063
Iteration 80, loss = 0.0023
--- Epoch 1236 / 1369 - 2869 epochs total
Iteration 0, loss = 0.0156
Iteration 20, loss = 0.0050
Iteration 40, loss = 0.0014
Iteration 60, loss = 0.0062
Iteration 80, loss = 0.0016
--- Epoch 1237 / 1369 - 2870 epochs total
Iteration 0, loss = 0.0130
Iteration 20, loss = 0.0118
Iteration 40, loss = 0.0030
Iteration 60, loss = 0.0048
Iteration 80, loss = 0.0063
--- Epoch 1238 / 1369 - 2871 epochs total
Iteration 0, loss = 0.0024
Iteration 20, loss = 0.0013
Iteration 40, loss = 0.0030
Iteration 60, loss = 0.0044
Iteration 80, loss = 0.0122
--- Epoch 1239 / 1369 - 2872 epochs total
Iteration 0, loss = 0.0021
Iteration 20, loss = 0.0084
Iteration 40, loss = 0.0020
Iteration 60, loss = 0.0032
Iteration 80, loss = 0.0090
--- Epoch 1240 / 1369 - 2873 epochs total
Iteration 0, loss = 0.0098
Iteration 20, loss = 0.0014
Iteration 40, loss = 0.0026
Iteration 60, loss = 0.0014
Iteration 80, loss = 0.0022
--- Epoch 1241 / 1369 - 2874 epochs total
Iteration 0, loss = 0.0375
Iteration 20, loss = 0.0085
Iteration 40, loss = 0.0016
Iteration 60, loss = 0.0043
Iteration 80, loss = 0.0055
--- Epoch 1242 / 1369 - 2875 epochs total
Iteration 0, loss = 0.0030
Iteration 20, loss = 0.0050
Iteration 40, loss = 0.0019
Iteration 60, loss = 0.0024
Iteration 80, loss = 0.0047
--- Epoch 1243 / 1369 - 2876 epochs total
Iteration 0, loss = 0.0013
Iteration 20, loss = 0.0080
Iteration 40, loss = 0.0030
Iteration 60, loss = 0.0013
Iteration 80, loss = 0.0099
--- Epoch 1244 / 1369 - 2877 epochs total
Iteration 0, loss = 0.0064
Iteration 20, loss = 0.0035
Iteration 40, loss = 0.0021
Iteration 60, loss = 0.0047
Iteration 80, loss = 0.0025
--- Epoch 1245 / 1369 - 2878 epochs total
Iteration 0, loss = 0.0026
Iteration 20, loss = 0.0178
Iteration 40, loss = 0.0029
Iteration 60, loss = 0.0084
Iteration 80, loss = 0.0040
--- Epoch 1246 / 1369 - 2879 epochs total
Iteration 0, loss = 0.0252
Iteration 20, loss = 0.0028
Iteration 40, loss = 0.0095
Iteration 60, loss = 0.0059
Iteration 80, loss = 0.0043
--- Epoch 1247 / 1369 - 2880 epochs total
Iteration 0, loss = 0.0030
Iteration 20, loss = 0.0055
Iteration 40, loss = 0.0014
Iteration 60, loss = 0.0013
Iteration 80, loss = 0.0016
--- Epoch 1248 / 1369 - 2881 epochs total
Iteration 0, loss = 0.0018
Iteration 20, loss = 0.0015
Iteration 40, loss = 0.0024
Iteration 60, loss = 0.0007
Iteration 80, loss = 0.0023
--- Epoch 1249 / 1369 - 2882 epochs total
Iteration 0, loss = 0.0015
Iteration 20, loss = 0.0127
Iteration 40, loss = 0.0014
Iteration 60, loss = 0.0100
Iteration 80, loss = 0.0068
--- Epoch 1250 / 1369 - 2883 epochs total
Iteration 0, loss = 0.0171
Iteration 20, loss = 0.0066
Iteration 40, loss = 0.0020
Iteration 60, loss = 0.0032
Iteration 80, loss = 0.0039
--- Epoch 1251 / 1369 - 2884 epochs total
Iteration 0, loss = 0.0070
Iteration 20, loss = 0.0058
Iteration 40, loss = 0.0016
Iteration 60, loss = 0.0032
Iteration 80, loss = 0.0012
--- Epoch 1252 / 1369 - 2885 epochs total
Iteration 0, loss = 0.0018
Iteration 20, loss = 0.0043
Iteration 40, loss = 0.0018
Iteration 60, loss = 0.0028
Iteration 80, loss = 0.0022
--- Epoch 1253 / 1369 - 2886 epochs total
Iteration 0, loss = 0.0032
Iteration 20, loss = 0.0073
Iteration 40, loss = 0.0055
Iteration 60, loss = 0.0250
Iteration 80, loss = 0.0081
--- Epoch 1254 / 1369 - 2887 epochs total
Iteration 0, loss = 0.0063
Iteration 20, loss = 0.0014
Iteration 40, loss = 0.0022
Iteration 60, loss = 0.0015
Iteration 80, loss = 0.0039
--- Epoch 1255 / 1369 - 2888 epochs total
Iteration 0, loss = 0.0135
Iteration 20, loss = 0.0043
Iteration 40, loss = 0.0043
Iteration 60, loss = 0.0052
Iteration 80, loss = 0.0077
--- Epoch 1256 / 1369 - 2889 epochs total
Iteration 0, loss = 0.0063
Iteration 20, loss = 0.0100
Iteration 40, loss = 0.0103
Iteration 60, loss = 0.0019
Iteration 80, loss = 0.0015
--- Epoch 1257 / 1369 - 2890 epochs total
Iteration 0, loss = 0.0021
Iteration 20, loss = 0.0024
Iteration 40, loss = 0.0010
Iteration 60, loss = 0.0129
Iteration 80, loss = 0.0024
--- Epoch 1258 / 1369 - 2891 epochs total
Iteration 0, loss = 0.0018
Iteration 20, loss = 0.0032
Iteration 40, loss = 0.0029
Iteration 60, loss = 0.0059
Iteration 80, loss = 0.0009
--- Epoch 1259 / 1369 - 2892 epochs total
Iteration 0, loss = 0.0009
Iteration 20, loss = 0.0029
Iteration 40, loss = 0.0018
Iteration 60, loss = 0.0068
Iteration 80, loss = 0.0024
--- Epoch 1260 / 1369 - 2893 epochs total
Iteration 0, loss = 0.0128
Iteration 20, loss = 0.0055
Iteration 40, loss = 0.0030
Iteration 60, loss = 0.0028
Iteration 80, loss = 0.0108
--- Epoch 1261 / 1369 - 2894 epochs total
Iteration 0, loss = 0.0040
Iteration 20, loss = 0.0022
Iteration 40, loss = 0.0060
Iteration 60, loss = 0.0098
Iteration 80, loss = 0.0023
--- Epoch 1262 / 1369 - 2895 epochs total
Iteration 0, loss = 0.0043
Iteration 20, loss = 0.0077
Iteration 40, loss = 0.0083
Iteration 60, loss = 0.0028
Iteration 80, loss = 0.0052
--- Epoch 1263 / 1369 - 2896 epochs total
Iteration 0, loss = 0.0005
Iteration 20, loss = 0.0014
Iteration 40, loss = 0.0031
Iteration 60, loss = 0.0038
Iteration 80, loss = 0.0057
--- Epoch 1264 / 1369 - 2897 epochs total
Iteration 0, loss = 0.0024
Iteration 20, loss = 0.0025
Iteration 40, loss = 0.0034
Iteration 60, loss = 0.0021
Iteration 80, loss = 0.0023
--- Epoch 1265 / 1369 - 2898 epochs total
Iteration 0, loss = 0.0017
Iteration 20, loss = 0.0264
Iteration 40, loss = 0.0030
Iteration 60, loss = 0.0151
Iteration 80, loss = 0.0028
--- Epoch 1266 / 1369 - 2899 epochs total
Iteration 0, loss = 0.0049
Iteration 20, loss = 0.0042
Iteration 40, loss = 0.0029
Iteration 60, loss = 0.0032
Iteration 80, loss = 0.0034
--- Epoch 1267 / 1369 - 2900 epochs total
Iteration 0, loss = 0.0030
Iteration 20, loss = 0.0029
Iteration 40, loss = 0.0073
Iteration 60, loss = 0.0056
Iteration 80, loss = 0.0034
--- Epoch 1268 / 1369 - 2901 epochs total
Iteration 0, loss = 0.0038
Iteration 20, loss = 0.0089
Iteration 40, loss = 0.0100
Iteration 60, loss = 0.0078
Iteration 80, loss = 0.0056
--- Epoch 1269 / 1369 - 2902 epochs total
Iteration 0, loss = 0.0040
Iteration 20, loss = 0.0071
Iteration 40, loss = 0.0059
Iteration 60, loss = 0.0056
Iteration 80, loss = 0.0031
--- Epoch 1270 / 1369 - 2903 epochs total
Iteration 0, loss = 0.0021
Iteration 20, loss = 0.0029
Iteration 40, loss = 0.0047
Iteration 60, loss = 0.0016
Iteration 80, loss = 0.0095
--- Epoch 1271 / 1369 - 2904 epochs total
Iteration 0, loss = 0.0210
Iteration 20, loss = 0.0113
Iteration 40, loss = 0.0079
Iteration 60, loss = 0.0005
Iteration 80, loss = 0.0009
--- Epoch 1272 / 1369 - 2905 epochs total
Iteration 0, loss = 0.0149
Iteration 20, loss = 0.0015
Iteration 40, loss = 0.0032
Iteration 60, loss = 0.0035
Iteration 80, loss = 0.0058
--- Epoch 1273 / 1369 - 2906 epochs total
Iteration 0, loss = 0.0099
Iteration 20, loss = 0.0020
Iteration 40, loss = 0.0039
Iteration 60, loss = 0.0018
Iteration 80, loss = 0.0093
--- Epoch 1274 / 1369 - 2907 epochs total
Iteration 0, loss = 0.0023
Iteration 20, loss = 0.0016
Iteration 40, loss = 0.0028
Iteration 60, loss = 0.0019
Iteration 80, loss = 0.0102
--- Epoch 1275 / 1369 - 2908 epochs total
Iteration 0, loss = 0.0013
Iteration 20, loss = 0.0047
Iteration 40, loss = 0.0042
Iteration 60, loss = 0.0050
Iteration 80, loss = 0.0031
--- Epoch 1276 / 1369 - 2909 epochs total
Iteration 0, loss = 0.0021
Iteration 20, loss = 0.0032
Iteration 40, loss = 0.0031
Iteration 60, loss = 0.0059
Iteration 80, loss = 0.0026
--- Epoch 1277 / 1369 - 2910 epochs total
Iteration 0, loss = 0.0028
Iteration 20, loss = 0.0034
Iteration 40, loss = 0.0027
Iteration 60, loss = 0.0071
Iteration 80, loss = 0.0100
--- Epoch 1278 / 1369 - 2911 epochs total
Iteration 0, loss = 0.0039
Iteration 20, loss = 0.0092
Iteration 40, loss = 0.0030
Iteration 60, loss = 0.0019
Iteration 80, loss = 0.0041
--- Epoch 1279 / 1369 - 2912 epochs total
Iteration 0, loss = 0.0009
Iteration 20, loss = 0.0068
Iteration 40, loss = 0.0051
Iteration 60, loss = 0.0049
Iteration 80, loss = 0.0138
--- Epoch 1280 / 1369 - 2913 epochs total
Iteration 0, loss = 0.0041
Iteration 20, loss = 0.0027
Iteration 40, loss = 0.0014
Iteration 60, loss = 0.0037
Iteration 80, loss = 0.0022
--- Epoch 1281 / 1369 - 2914 epochs total
Iteration 0, loss = 0.0054
Iteration 20, loss = 0.0032
Iteration 40, loss = 0.0019
Iteration 60, loss = 0.0028
Iteration 80, loss = 0.0015
--- Epoch 1282 / 1369 - 2915 epochs total
Iteration 0, loss = 0.0019
Iteration 20, loss = 0.0129
Iteration 40, loss = 0.0019
Iteration 60, loss = 0.0086
Iteration 80, loss = 0.0050
--- Epoch 1283 / 1369 - 2916 epochs total
Iteration 0, loss = 0.0030
Iteration 20, loss = 0.0011
Iteration 40, loss = 0.0069
Iteration 60, loss = 0.0178
Iteration 80, loss = 0.0023
--- Epoch 1284 / 1369 - 2917 epochs total
Iteration 0, loss = 0.0040
Iteration 20, loss = 0.0051
Iteration 40, loss = 0.0090
Iteration 60, loss = 0.0034
Iteration 80, loss = 0.0012
--- Epoch 1285 / 1369 - 2918 epochs total
Iteration 0, loss = 0.0037
Iteration 20, loss = 0.0039
Iteration 40, loss = 0.0132
Iteration 60, loss = 0.0008
Iteration 80, loss = 0.0156
--- Epoch 1286 / 1369 - 2919 epochs total
Iteration 0, loss = 0.0030
Iteration 20, loss = 0.0036
Iteration 40, loss = 0.0026
Iteration 60, loss = 0.0046
Iteration 80, loss = 0.0049
--- Epoch 1287 / 1369 - 2920 epochs total
Iteration 0, loss = 0.0018
Iteration 20, loss = 0.0375
Iteration 40, loss = 0.0141
Iteration 60, loss = 0.0023
Iteration 80, loss = 0.0017
--- Epoch 1288 / 1369 - 2921 epochs total
Iteration 0, loss = 0.0054
Iteration 20, loss = 0.0020
Iteration 40, loss = 0.0034
Iteration 60, loss = 0.0048
Iteration 80, loss = 0.0035
--- Epoch 1289 / 1369 - 2922 epochs total
Iteration 0, loss = 0.0149
Iteration 20, loss = 0.0118
Iteration 40, loss = 0.0060
Iteration 60, loss = 0.0049
Iteration 80, loss = 0.0024
--- Epoch 1290 / 1369 - 2923 epochs total
Iteration 0, loss = 0.0047
Iteration 20, loss = 0.0019
Iteration 40, loss = 0.0055
Iteration 60, loss = 0.0090
Iteration 80, loss = 0.0040
--- Epoch 1291 / 1369 - 2924 epochs total
Iteration 0, loss = 0.0021
Iteration 20, loss = 0.0030
Iteration 40, loss = 0.0032
Iteration 60, loss = 0.0069
Iteration 80, loss = 0.0044
--- Epoch 1292 / 1369 - 2925 epochs total
Iteration 0, loss = 0.0030
Iteration 20, loss = 0.0035
Iteration 40, loss = 0.0012
Iteration 60, loss = 0.0018
Iteration 80, loss = 0.0024
--- Epoch 1293 / 1369 - 2926 epochs total
Iteration 0, loss = 0.0057
Iteration 20, loss = 0.0039
Iteration 40, loss = 0.0027
Iteration 60, loss = 0.0039
Iteration 80, loss = 0.0024
--- Epoch 1294 / 1369 - 2927 epochs total
Iteration 0, loss = 0.0012
Iteration 20, loss = 0.0031
Iteration 40, loss = 0.0017
Iteration 60, loss = 0.0023
Iteration 80, loss = 0.0033
--- Epoch 1295 / 1369 - 2928 epochs total
Iteration 0, loss = 0.0018
Iteration 20, loss = 0.0024
Iteration 40, loss = 0.0058
Iteration 60, loss = 0.0072
Iteration 80, loss = 0.0131
--- Epoch 1296 / 1369 - 2929 epochs total
Iteration 0, loss = 0.0127
Iteration 20, loss = 0.0011
Iteration 40, loss = 0.0016
Iteration 60, loss = 0.0100
Iteration 80, loss = 0.0015
--- Epoch 1297 / 1369 - 2930 epochs total
Iteration 0, loss = 0.0021
Iteration 20, loss = 0.0046
Iteration 40, loss = 0.0033
Iteration 60, loss = 0.0078
Iteration 80, loss = 0.0037
--- Epoch 1298 / 1369 - 2931 epochs total
Iteration 0, loss = 0.0131
Iteration 20, loss = 0.0035
Iteration 40, loss = 0.0027
Iteration 60, loss = 0.0099
Iteration 80, loss = 0.0053
--- Epoch 1299 / 1369 - 2932 epochs total
Iteration 0, loss = 0.0095
Iteration 20, loss = 0.0170
Iteration 40, loss = 0.0050
Iteration 60, loss = 0.0009
Iteration 80, loss = 0.0087
--- Epoch 1300 / 1369 - 2933 epochs total
Iteration 0, loss = 0.0055
Iteration 20, loss = 0.0023
Iteration 40, loss = 0.0016
Iteration 60, loss = 0.0016
Iteration 80, loss = 0.0132
--- Epoch 1301 / 1369 - 2934 epochs total
Iteration 0, loss = 0.0079
Iteration 20, loss = 0.0033
Iteration 40, loss = 0.0081
Iteration 60, loss = 0.0010
Iteration 80, loss = 0.0021
--- Epoch 1302 / 1369 - 2935 epochs total
Iteration 0, loss = 0.0031
Iteration 20, loss = 0.0047
Iteration 40, loss = 0.0018
Iteration 60, loss = 0.0173
Iteration 80, loss = 0.0059
--- Epoch 1303 / 1369 - 2936 epochs total
Iteration 0, loss = 0.0011
Iteration 20, loss = 0.0051
Iteration 40, loss = 0.0150
Iteration 60, loss = 0.0048
Iteration 80, loss = 0.0041
--- Epoch 1304 / 1369 - 2937 epochs total
Iteration 0, loss = 0.0036
Iteration 20, loss = 0.0084
Iteration 40, loss = 0.0037
Iteration 60, loss = 0.0028
Iteration 80, loss = 0.0051
--- Epoch 1305 / 1369 - 2938 epochs total
Iteration 0, loss = 0.0026
Iteration 20, loss = 0.0028
Iteration 40, loss = 0.0028
Iteration 60, loss = 0.0030
Iteration 80, loss = 0.0025
--- Epoch 1306 / 1369 - 2939 epochs total
Iteration 0, loss = 0.0040
Iteration 20, loss = 0.0032
Iteration 40, loss = 0.0048
Iteration 60, loss = 0.0018
Iteration 80, loss = 0.0033
--- Epoch 1307 / 1369 - 2940 epochs total
Iteration 0, loss = 0.0078
Iteration 20, loss = 0.0084
Iteration 40, loss = 0.0037
Iteration 60, loss = 0.0140
Iteration 80, loss = 0.0056
--- Epoch 1308 / 1369 - 2941 epochs total
Iteration 0, loss = 0.0013
Iteration 20, loss = 0.0047
Iteration 40, loss = 0.0058
Iteration 60, loss = 0.0062
Iteration 80, loss = 0.0029
--- Epoch 1309 / 1369 - 2942 epochs total
Iteration 0, loss = 0.0038
Iteration 20, loss = 0.0070
Iteration 40, loss = 0.0015
Iteration 60, loss = 0.0410
Iteration 80, loss = 0.0018
--- Epoch 1310 / 1369 - 2943 epochs total
Iteration 0, loss = 0.0041
Iteration 20, loss = 0.0015
Iteration 40, loss = 0.0062
Iteration 60, loss = 0.0010
Iteration 80, loss = 0.0051
--- Epoch 1311 / 1369 - 2944 epochs total
Iteration 0, loss = 0.0019
Iteration 20, loss = 0.0066
Iteration 40, loss = 0.0034
Iteration 60, loss = 0.0032
Iteration 80, loss = 0.0022
--- Epoch 1312 / 1369 - 2945 epochs total
Iteration 0, loss = 0.0034
Iteration 20, loss = 0.0028
Iteration 40, loss = 0.0068
Iteration 60, loss = 0.0054
Iteration 80, loss = 0.0041
--- Epoch 1313 / 1369 - 2946 epochs total
Iteration 0, loss = 0.0042
Iteration 20, loss = 0.0059
Iteration 40, loss = 0.0050
Iteration 60, loss = 0.0049
Iteration 80, loss = 0.0030
--- Epoch 1314 / 1369 - 2947 epochs total
Iteration 0, loss = 0.0033
Iteration 20, loss = 0.0094
Iteration 40, loss = 0.0038
Iteration 60, loss = 0.0042
Iteration 80, loss = 0.0012
--- Epoch 1315 / 1369 - 2948 epochs total
Iteration 0, loss = 0.0057
Iteration 20, loss = 0.0030
Iteration 40, loss = 0.0036
Iteration 60, loss = 0.0018
Iteration 80, loss = 0.0019
--- Epoch 1316 / 1369 - 2949 epochs total
Iteration 0, loss = 0.0071
Iteration 20, loss = 0.0087
Iteration 40, loss = 0.0027
Iteration 60, loss = 0.0125
Iteration 80, loss = 0.0093
--- Epoch 1317 / 1369 - 2950 epochs total
Iteration 0, loss = 0.0091
Iteration 20, loss = 0.0062
Iteration 40, loss = 0.0020
Iteration 60, loss = 0.0119
Iteration 80, loss = 0.0028
--- Epoch 1318 / 1369 - 2951 epochs total
Iteration 0, loss = 0.0208
Iteration 20, loss = 0.0059
Iteration 40, loss = 0.0021
Iteration 60, loss = 0.0027
Iteration 80, loss = 0.0012
--- Epoch 1319 / 1369 - 2952 epochs total
Iteration 0, loss = 0.0045
Iteration 20, loss = 0.0021
Iteration 40, loss = 0.0069
Iteration 60, loss = 0.0099
Iteration 80, loss = 0.0016
--- Epoch 1320 / 1369 - 2953 epochs total
Iteration 0, loss = 0.0025
Iteration 20, loss = 0.0090
Iteration 40, loss = 0.0071
Iteration 60, loss = 0.0010
Iteration 80, loss = 0.0014
--- Epoch 1321 / 1369 - 2954 epochs total
Iteration 0, loss = 0.0037
Iteration 20, loss = 0.0029
Iteration 40, loss = 0.0022
Iteration 60, loss = 0.0032
Iteration 80, loss = 0.0029
--- Epoch 1322 / 1369 - 2955 epochs total
Iteration 0, loss = 0.0100
Iteration 20, loss = 0.0028
Iteration 40, loss = 0.0044
Iteration 60, loss = 0.0071
Iteration 80, loss = 0.0031
--- Epoch 1323 / 1369 - 2956 epochs total
Iteration 0, loss = 0.0075
Iteration 20, loss = 0.0032
Iteration 40, loss = 0.0064
Iteration 60, loss = 0.0010
Iteration 80, loss = 0.0069
--- Epoch 1324 / 1369 - 2957 epochs total
Iteration 0, loss = 0.0049
Iteration 20, loss = 0.0053
Iteration 40, loss = 0.0070
Iteration 60, loss = 0.0119
Iteration 80, loss = 0.0070
--- Epoch 1325 / 1369 - 2958 epochs total
Iteration 0, loss = 0.0034
Iteration 20, loss = 0.0021
Iteration 40, loss = 0.0011
Iteration 60, loss = 0.0022
Iteration 80, loss = 0.0183
--- Epoch 1326 / 1369 - 2959 epochs total
Iteration 0, loss = 0.0007
Iteration 20, loss = 0.0009
Iteration 40, loss = 0.0026
Iteration 60, loss = 0.0035
Iteration 80, loss = 0.0064
--- Epoch 1327 / 1369 - 2960 epochs total
Iteration 0, loss = 0.0145
Iteration 20, loss = 0.0015
Iteration 40, loss = 0.0033
Iteration 60, loss = 0.0094
Iteration 80, loss = 0.0034
--- Epoch 1328 / 1369 - 2961 epochs total
Iteration 0, loss = 0.0021
Iteration 20, loss = 0.0017
Iteration 40, loss = 0.0039
Iteration 60, loss = 0.0035
Iteration 80, loss = 0.0280
--- Epoch 1329 / 1369 - 2962 epochs total
Iteration 0, loss = 0.0121
Iteration 20, loss = 0.0032
Iteration 40, loss = 0.0047
Iteration 60, loss = 0.0074
Iteration 80, loss = 0.0025
--- Epoch 1330 / 1369 - 2963 epochs total
Iteration 0, loss = 0.0081
Iteration 20, loss = 0.0040
Iteration 40, loss = 0.0061
Iteration 60, loss = 0.0508
Iteration 80, loss = 0.0051
--- Epoch 1331 / 1369 - 2964 epochs total
Iteration 0, loss = 0.0012
Iteration 20, loss = 0.0017
Iteration 40, loss = 0.0009
Iteration 60, loss = 0.0019
Iteration 80, loss = 0.0011
--- Epoch 1332 / 1369 - 2965 epochs total
Iteration 0, loss = 0.0011
Iteration 20, loss = 0.0019
Iteration 40, loss = 0.0028
Iteration 60, loss = 0.0036
Iteration 80, loss = 0.0020
--- Epoch 1333 / 1369 - 2966 epochs total
Iteration 0, loss = 0.0031
Iteration 20, loss = 0.0041
Iteration 40, loss = 0.0039
Iteration 60, loss = 0.0021
Iteration 80, loss = 0.0049
--- Epoch 1334 / 1369 - 2967 epochs total
Iteration 0, loss = 0.0066
Iteration 20, loss = 0.0022
Iteration 40, loss = 0.0123
Iteration 60, loss = 0.0034
Iteration 80, loss = 0.0018
--- Epoch 1335 / 1369 - 2968 epochs total
Iteration 0, loss = 0.0112
Iteration 20, loss = 0.0022
Iteration 40, loss = 0.0011
Iteration 60, loss = 0.0088
Iteration 80, loss = 0.0031
--- Epoch 1336 / 1369 - 2969 epochs total
Iteration 0, loss = 0.0025
Iteration 20, loss = 0.0027
Iteration 40, loss = 0.0022
Iteration 60, loss = 0.0020
Iteration 80, loss = 0.0026
--- Epoch 1337 / 1369 - 2970 epochs total
Iteration 0, loss = 0.0020
Iteration 20, loss = 0.0042
Iteration 40, loss = 0.0024
Iteration 60, loss = 0.0010
Iteration 80, loss = 0.0015
--- Epoch 1338 / 1369 - 2971 epochs total
Iteration 0, loss = 0.0010
Iteration 20, loss = 0.0025
Iteration 40, loss = 0.0150
Iteration 60, loss = 0.0009
Iteration 80, loss = 0.0059
--- Epoch 1339 / 1369 - 2972 epochs total
Iteration 0, loss = 0.0104
Iteration 20, loss = 0.0049
Iteration 40, loss = 0.0046
Iteration 60, loss = 0.0089
Iteration 80, loss = 0.0013
--- Epoch 1340 / 1369 - 2973 epochs total
Iteration 0, loss = 0.0021
Iteration 20, loss = 0.0082
Iteration 40, loss = 0.0062
Iteration 60, loss = 0.0061
Iteration 80, loss = 0.0022
--- Epoch 1341 / 1369 - 2974 epochs total
Iteration 0, loss = 0.0009
Iteration 20, loss = 0.0048
Iteration 40, loss = 0.0033
Iteration 60, loss = 0.0044
Iteration 80, loss = 0.0012
--- Epoch 1342 / 1369 - 2975 epochs total
Iteration 0, loss = 0.0024
Iteration 20, loss = 0.0063
Iteration 40, loss = 0.0040
Iteration 60, loss = 0.0105
Iteration 80, loss = 0.0081
--- Epoch 1343 / 1369 - 2976 epochs total
Iteration 0, loss = 0.0052
Iteration 20, loss = 0.0079
Iteration 40, loss = 0.0035
Iteration 60, loss = 0.0013
Iteration 80, loss = 0.0157
--- Epoch 1344 / 1369 - 2977 epochs total
Iteration 0, loss = 0.0053
Iteration 20, loss = 0.0011
Iteration 40, loss = 0.0033
Iteration 60, loss = 0.0105
Iteration 80, loss = 0.0038
--- Epoch 1345 / 1369 - 2978 epochs total
Iteration 0, loss = 0.0034
Iteration 20, loss = 0.0010
Iteration 40, loss = 0.0053
Iteration 60, loss = 0.0007
Iteration 80, loss = 0.0013
--- Epoch 1346 / 1369 - 2979 epochs total
Iteration 0, loss = 0.0042
Iteration 20, loss = 0.0012
Iteration 40, loss = 0.0012
Iteration 60, loss = 0.0021
Iteration 80, loss = 0.0102
--- Epoch 1347 / 1369 - 2980 epochs total
Iteration 0, loss = 0.0088
Iteration 20, loss = 0.0022
Iteration 40, loss = 0.0020
Iteration 60, loss = 0.0013
Iteration 80, loss = 0.0057
--- Epoch 1348 / 1369 - 2981 epochs total
Iteration 0, loss = 0.0025
Iteration 20, loss = 0.0019
Iteration 40, loss = 0.0121
Iteration 60, loss = 0.0026
Iteration 80, loss = 0.0195
--- Epoch 1349 / 1369 - 2982 epochs total
Iteration 0, loss = 0.0009
Iteration 20, loss = 0.0027
Iteration 40, loss = 0.0020
Iteration 60, loss = 0.0037
Iteration 80, loss = 0.0050
--- Epoch 1350 / 1369 - 2983 epochs total
Iteration 0, loss = 0.0031
Iteration 20, loss = 0.0069
Iteration 40, loss = 0.0063
Iteration 60, loss = 0.0040
Iteration 80, loss = 0.0132
--- Epoch 1351 / 1369 - 2984 epochs total
Iteration 0, loss = 0.0042
Iteration 20, loss = 0.0020
Iteration 40, loss = 0.0024
Iteration 60, loss = 0.0023
Iteration 80, loss = 0.0033
--- Epoch 1352 / 1369 - 2985 epochs total
Iteration 0, loss = 0.0043
Iteration 20, loss = 0.0021
Iteration 40, loss = 0.0015
Iteration 60, loss = 0.0188
Iteration 80, loss = 0.0028
--- Epoch 1353 / 1369 - 2986 epochs total
Iteration 0, loss = 0.0018
Iteration 20, loss = 0.0010
Iteration 40, loss = 0.0090
Iteration 60, loss = 0.0026
Iteration 80, loss = 0.0030
--- Epoch 1354 / 1369 - 2987 epochs total
Iteration 0, loss = 0.0022
Iteration 20, loss = 0.0064
Iteration 40, loss = 0.0053
Iteration 60, loss = 0.0031
Iteration 80, loss = 0.0062
--- Epoch 1355 / 1369 - 2988 epochs total
Iteration 0, loss = 0.0118
Iteration 20, loss = 0.0098
Iteration 40, loss = 0.0185
Iteration 60, loss = 0.0005
Iteration 80, loss = 0.0044
--- Epoch 1356 / 1369 - 2989 epochs total
Iteration 0, loss = 0.0047
Iteration 20, loss = 0.0022
Iteration 40, loss = 0.0052
Iteration 60, loss = 0.0045
Iteration 80, loss = 0.0067
--- Epoch 1357 / 1369 - 2990 epochs total
Iteration 0, loss = 0.0173
Iteration 20, loss = 0.0079
Iteration 40, loss = 0.0016
Iteration 60, loss = 0.0012
Iteration 80, loss = 0.0011
--- Epoch 1358 / 1369 - 2991 epochs total
Iteration 0, loss = 0.0151
Iteration 20, loss = 0.0047
Iteration 40, loss = 0.0017
Iteration 60, loss = 0.0039
Iteration 80, loss = 0.0026
--- Epoch 1359 / 1369 - 2992 epochs total
Iteration 0, loss = 0.0068
Iteration 20, loss = 0.0041
Iteration 40, loss = 0.0107
Iteration 60, loss = 0.0414
Iteration 80, loss = 0.0047
--- Epoch 1360 / 1369 - 2993 epochs total
Iteration 0, loss = 0.0028
Iteration 20, loss = 0.0094
Iteration 40, loss = 0.0156
Iteration 60, loss = 0.0027
Iteration 80, loss = 0.0104
--- Epoch 1361 / 1369 - 2994 epochs total
Iteration 0, loss = 0.0049
Iteration 20, loss = 0.0034
Iteration 40, loss = 0.0029
Iteration 60, loss = 0.0062
Iteration 80, loss = 0.0033
--- Epoch 1362 / 1369 - 2995 epochs total
Iteration 0, loss = 0.0029
Iteration 20, loss = 0.0035
Iteration 40, loss = 0.0042
Iteration 60, loss = 0.0023
Iteration 80, loss = 0.0016
--- Epoch 1363 / 1369 - 2996 epochs total
Iteration 0, loss = 0.0016
Iteration 20, loss = 0.0078
Iteration 40, loss = 0.0090
Iteration 60, loss = 0.0024
Iteration 80, loss = 0.0121
--- Epoch 1364 / 1369 - 2997 epochs total
Iteration 0, loss = 0.0031
Iteration 20, loss = 0.0034
Iteration 40, loss = 0.0068
Iteration 60, loss = 0.0138
Iteration 80, loss = 0.0033
--- Epoch 1365 / 1369 - 2998 epochs total
Iteration 0, loss = 0.0127
Iteration 20, loss = 0.0021
Iteration 40, loss = 0.0011
Iteration 60, loss = 0.0028
Iteration 80, loss = 0.0107
--- Epoch 1366 / 1369 - 2999 epochs total
Iteration 0, loss = 0.0120
Iteration 20, loss = 0.0044
Iteration 40, loss = 0.0040
Iteration 60, loss = 0.0027
Iteration 80, loss = 0.0081
--- Epoch 1367 / 1369 - 3000 epochs total
Iteration 0, loss = 0.0065
Iteration 20, loss = 0.0021
Iteration 40, loss = 0.0079
Iteration 60, loss = 0.0154
Iteration 80, loss = 0.0058
--- Epoch 1368 / 1369 - 3001 epochs total
Iteration 0, loss = 0.0038
Iteration 20, loss = 0.0049
Iteration 40, loss = 0.0013
Iteration 60, loss = 0.0190
Iteration 80, loss = 0.0012
--- Epoch 1369 / 1369 - 3002 epochs total
Iteration 0, loss = 0.0027
Iteration 20, loss = 0.0089
Iteration 40, loss = 0.0058
Iteration 60, loss = 0.0013
Iteration 80, loss = 0.0021
In [137]:
# Run model13 against the arrays stored under the "*_truck" test keys, scoring
# with mean-squared error.
# NOTE(review): testModel is defined elsewhere in the notebook; presumably it
# reports the loss for the given split -- confirm against its definition.
testModel(
    model13,
    x_test=data["X_test_truck"],
    y_test=data["y_test_truck"],
    criterion=nn.MSELoss(),
)
In [138]:
# Set up a new ConvNet4 instance (model14) together with a plain SGD optimizer.
# Both `learning_rate` and `optimizer` are notebook-level names, so running
# this cell replaces whatever they were bound to before.
learning_rate = 1e-2  # fixed SGD step size
model14 = ConvNet4()
optimizer = optim.SGD(
    model14.parameters(),
    lr=learning_rate,
)
In [161]:
# Fit model14 on the "X_train"/"y_train" arrays with a mean-squared-error loss.
# NOTE(review): epochs=100000 is effectively an open-ended budget; presumably
# the run is meant to be stopped by hand -- confirm.
# NOTE(review): the logged "epochs total" counter starts at 2449 for this
# call, which suggests the cell was re-run on an already-trained model14 --
# verify before expecting the same output from a fresh kernel.
train(
    model14,
    optimizer,
    epochs=100000,
    x_train=data["X_train"],
    y_train=data["y_train"],
    criterion=nn.MSELoss(),
)
--- Epoch 1 / 100000 - 2449 epochs total
Iteration 0, loss = 0.0090
Iteration 20, loss = 0.0238
Iteration 40, loss = 0.0048
Iteration 60, loss = 0.0129
Iteration 80, loss = 0.0043
--- Epoch 2 / 100000 - 2450 epochs total
Iteration 0, loss = 0.0062
Iteration 20, loss = 0.0110
Iteration 40, loss = 0.0187
Iteration 60, loss = 0.0036
Iteration 80, loss = 0.0032
--- Epoch 3 / 100000 - 2451 epochs total
Iteration 0, loss = 0.0042
Iteration 20, loss = 0.0462
Iteration 40, loss = 0.0058
Iteration 60, loss = 0.0107
Iteration 80, loss = 0.0043
--- Epoch 4 / 100000 - 2452 epochs total
Iteration 0, loss = 0.0074
Iteration 20, loss = 0.0072
Iteration 40, loss = 0.0059
Iteration 60, loss = 0.0076
Iteration 80, loss = 0.0051
--- Epoch 5 / 100000 - 2453 epochs total
Iteration 0, loss = 0.0064
Iteration 20, loss = 0.0047
Iteration 40, loss = 0.0130
Iteration 60, loss = 0.0011
Iteration 80, loss = 0.0027
--- Epoch 6 / 100000 - 2454 epochs total
Iteration 0, loss = 0.0042
Iteration 20, loss = 0.0022
Iteration 40, loss = 0.0043
Iteration 60, loss = 0.0021
Iteration 80, loss = 0.0065
--- Epoch 7 / 100000 - 2455 epochs total
Iteration 0, loss = 0.0016
Iteration 20, loss = 0.0129
Iteration 40, loss = 0.0036
Iteration 60, loss = 0.0078
Iteration 80, loss = 0.0023
--- Epoch 8 / 100000 - 2456 epochs total
Iteration 0, loss = 0.0038
Iteration 20, loss = 0.0026
Iteration 40, loss = 0.0042
Iteration 60, loss = 0.0078
Iteration 80, loss = 0.0051
--- Epoch 9 / 100000 - 2457 epochs total
Iteration 0, loss = 0.0193
Iteration 20, loss = 0.0017
Iteration 40, loss = 0.0148
Iteration 60, loss = 0.0038
Iteration 80, loss = 0.0173
--- Epoch 10 / 100000 - 2458 epochs total
Iteration 0, loss = 0.0123
Iteration 20, loss = 0.0012
Iteration 40, loss = 0.0022
Iteration 60, loss = 0.0044
Iteration 80, loss = 0.0032
--- Epoch 11 / 100000 - 2459 epochs total
Iteration 0, loss = 0.0029
Iteration 20, loss = 0.0054
Iteration 40, loss = 0.0248
Iteration 60, loss = 0.0074
Iteration 80, loss = 0.0337
--- Epoch 12 / 100000 - 2460 epochs total
Iteration 0, loss = 0.0199
Iteration 20, loss = 0.0045
Iteration 40, loss = 0.0058
Iteration 60, loss = 0.0116
Iteration 80, loss = 0.0380
--- Epoch 13 / 100000 - 2461 epochs total
Iteration 0, loss = 0.0022
Iteration 20, loss = 0.0037
Iteration 40, loss = 0.0168
Iteration 60, loss = 0.0068
Iteration 80, loss = 0.0108
--- Epoch 14 / 100000 - 2462 epochs total
Iteration 0, loss = 0.0061
Iteration 20, loss = 0.0021
Iteration 40, loss = 0.0021
Iteration 60, loss = 0.0054
Iteration 80, loss = 0.0037
--- Epoch 15 / 100000 - 2463 epochs total
Iteration 0, loss = 0.0041
Iteration 20, loss = 0.0187
Iteration 40, loss = 0.0193
Iteration 60, loss = 0.0126
Iteration 80, loss = 0.0161
--- Epoch 16 / 100000 - 2464 epochs total
Iteration 0, loss = 0.0019
Iteration 20, loss = 0.0029
Iteration 40, loss = 0.0014
Iteration 60, loss = 0.0331
Iteration 80, loss = 0.0037
--- Epoch 17 / 100000 - 2465 epochs total
Iteration 0, loss = 0.0021
Iteration 20, loss = 0.0191
Iteration 40, loss = 0.0056
Iteration 60, loss = 0.0047
Iteration 80, loss = 0.0052
--- Epoch 18 / 100000 - 2466 epochs total
Iteration 0, loss = 0.0031
Iteration 20, loss = 0.0143
Iteration 40, loss = 0.0041
Iteration 60, loss = 0.0057
Iteration 80, loss = 0.0207
--- Epoch 19 / 100000 - 2467 epochs total
Iteration 0, loss = 0.0358
Iteration 20, loss = 0.0037
Iteration 40, loss = 0.0028
Iteration 60, loss = 0.0112
Iteration 80, loss = 0.0040
--- Epoch 20 / 100000 - 2468 epochs total
Iteration 0, loss = 0.0025
Iteration 20, loss = 0.0023
Iteration 40, loss = 0.0132
Iteration 60, loss = 0.0019
Iteration 80, loss = 0.0138
--- Epoch 21 / 100000 - 2469 epochs total
Iteration 0, loss = 0.0015
Iteration 20, loss = 0.0073
Iteration 40, loss = 0.0115
Iteration 60, loss = 0.0265
Iteration 80, loss = 0.0090
--- Epoch 22 / 100000 - 2470 epochs total
Iteration 0, loss = 0.0073
Iteration 20, loss = 0.0089
Iteration 40, loss = 0.0041
Iteration 60, loss = 0.0027
Iteration 80, loss = 0.0025
--- Epoch 23 / 100000 - 2471 epochs total
Iteration 0, loss = 0.0102
Iteration 20, loss = 0.0087
Iteration 40, loss = 0.0115
Iteration 60, loss = 0.0045
Iteration 80, loss = 0.0334
--- Epoch 24 / 100000 - 2472 epochs total
Iteration 0, loss = 0.0155
Iteration 20, loss = 0.0077
Iteration 40, loss = 0.0049
Iteration 60, loss = 0.0104
Iteration 80, loss = 0.0040
--- Epoch 25 / 100000 - 2473 epochs total
Iteration 0, loss = 0.0077
Iteration 20, loss = 0.0023
Iteration 40, loss = 0.0035
Iteration 60, loss = 0.0014
Iteration 80, loss = 0.0064
--- Epoch 26 / 100000 - 2474 epochs total
Iteration 0, loss = 0.0088
Iteration 20, loss = 0.0035
Iteration 40, loss = 0.0117
Iteration 60, loss = 0.0016
Iteration 80, loss = 0.0032
--- Epoch 27 / 100000 - 2475 epochs total
Iteration 0, loss = 0.0058
Iteration 20, loss = 0.0042
Iteration 40, loss = 0.0058
Iteration 60, loss = 0.0119
Iteration 80, loss = 0.0144
--- Epoch 28 / 100000 - 2476 epochs total
Iteration 0, loss = 0.0066
Iteration 20, loss = 0.0088
Iteration 40, loss = 0.0053
Iteration 60, loss = 0.0049
Iteration 80, loss = 0.0090
--- Epoch 29 / 100000 - 2477 epochs total
Iteration 0, loss = 0.0334
Iteration 20, loss = 0.0195
Iteration 40, loss = 0.0051
Iteration 60, loss = 0.0272
Iteration 80, loss = 0.0018
--- Epoch 30 / 100000 - 2478 epochs total
Iteration 0, loss = 0.0030
Iteration 20, loss = 0.0015
Iteration 40, loss = 0.0206
Iteration 60, loss = 0.0109
Iteration 80, loss = 0.0050
--- Epoch 31 / 100000 - 2479 epochs total
Iteration 0, loss = 0.0048
Iteration 20, loss = 0.0078
Iteration 40, loss = 0.0120
Iteration 60, loss = 0.0015
Iteration 80, loss = 0.0134
--- Epoch 32 / 100000 - 2480 epochs total
Iteration 0, loss = 0.0022
Iteration 20, loss = 0.0034
Iteration 40, loss = 0.0026
Iteration 60, loss = 0.0133
Iteration 80, loss = 0.0033
--- Epoch 33 / 100000 - 2481 epochs total
Iteration 0, loss = 0.0018
Iteration 20, loss = 0.0357
Iteration 40, loss = 0.0198
Iteration 60, loss = 0.0373
Iteration 80, loss = 0.0118
--- Epoch 34 / 100000 - 2482 epochs total
Iteration 0, loss = 0.0019
Iteration 20, loss = 0.0108
Iteration 40, loss = 0.0309
Iteration 60, loss = 0.0100
Iteration 80, loss = 0.0014
--- Epoch 35 / 100000 - 2483 epochs total
Iteration 0, loss = 0.0122
Iteration 20, loss = 0.0017
Iteration 40, loss = 0.0142
Iteration 60, loss = 0.0042
Iteration 80, loss = 0.0043
--- Epoch 36 / 100000 - 2484 epochs total
Iteration 0, loss = 0.0021
Iteration 20, loss = 0.0061
Iteration 40, loss = 0.0060
Iteration 60, loss = 0.0195
Iteration 80, loss = 0.0019
--- Epoch 37 / 100000 - 2485 epochs total
Iteration 0, loss = 0.0042
Iteration 20, loss = 0.0028
Iteration 40, loss = 0.0042
Iteration 60, loss = 0.0087
Iteration 80, loss = 0.0031
--- Epoch 38 / 100000 - 2486 epochs total
Iteration 0, loss = 0.0130
Iteration 20, loss = 0.0093
Iteration 40, loss = 0.0050
Iteration 60, loss = 0.0052
Iteration 80, loss = 0.0075
--- Epoch 39 / 100000 - 2487 epochs total
Iteration 0, loss = 0.0024
Iteration 20, loss = 0.0112
Iteration 40, loss = 0.0202
Iteration 60, loss = 0.0029
Iteration 80, loss = 0.0107
--- Epoch 40 / 100000 - 2488 epochs total
Iteration 0, loss = 0.0069
Iteration 20, loss = 0.0072
Iteration 40, loss = 0.0030
Iteration 60, loss = 0.0103
Iteration 80, loss = 0.0103
--- Epoch 41 / 100000 - 2489 epochs total
Iteration 0, loss = 0.0153
Iteration 20, loss = 0.0066
Iteration 40, loss = 0.0046
Iteration 60, loss = 0.0046
Iteration 80, loss = 0.0050
--- Epoch 42 / 100000 - 2490 epochs total
Iteration 0, loss = 0.0052
Iteration 20, loss = 0.0049
Iteration 40, loss = 0.0038
Iteration 60, loss = 0.0081
Iteration 80, loss = 0.0135
--- Epoch 43 / 100000 - 2491 epochs total
Iteration 0, loss = 0.0020
Iteration 20, loss = 0.0077
Iteration 40, loss = 0.0055
Iteration 60, loss = 0.0116
Iteration 80, loss = 0.0367
--- Epoch 44 / 100000 - 2492 epochs total
Iteration 0, loss = 0.0062
Iteration 20, loss = 0.0050
Iteration 40, loss = 0.0035
Iteration 60, loss = 0.0034
Iteration 80, loss = 0.0039
--- Epoch 45 / 100000 - 2493 epochs total
Iteration 0, loss = 0.0027
Iteration 20, loss = 0.0043
Iteration 40, loss = 0.0091
Iteration 60, loss = 0.0342
Iteration 80, loss = 0.0319
--- Epoch 46 / 100000 - 2494 epochs total
Iteration 0, loss = 0.0112
Iteration 20, loss = 0.0032
Iteration 40, loss = 0.0035
Iteration 60, loss = 0.0073
Iteration 80, loss = 0.0048
--- Epoch 47 / 100000 - 2495 epochs total
Iteration 0, loss = 0.0053
Iteration 20, loss = 0.0045
Iteration 40, loss = 0.0103
Iteration 60, loss = 0.0291
Iteration 80, loss = 0.0039
--- Epoch 48 / 100000 - 2496 epochs total
Iteration 0, loss = 0.0088
Iteration 20, loss = 0.0020
Iteration 40, loss = 0.0220
Iteration 60, loss = 0.0108
Iteration 80, loss = 0.0243
--- Epoch 49 / 100000 - 2497 epochs total
Iteration 0, loss = 0.0029
Iteration 20, loss = 0.0150
Iteration 40, loss = 0.0111
Iteration 60, loss = 0.0418
Iteration 80, loss = 0.0075
--- Epoch 50 / 100000 - 2498 epochs total
Iteration 0, loss = 0.0012
Iteration 20, loss = 0.0141
Iteration 40, loss = 0.0040
Iteration 60, loss = 0.0062
Iteration 80, loss = 0.0037
--- Epoch 51 / 100000 - 2499 epochs total
Iteration 0, loss = 0.0046
Iteration 20, loss = 0.0141
Iteration 40, loss = 0.0067
Iteration 60, loss = 0.0061
Iteration 80, loss = 0.0024
--- Epoch 52 / 100000 - 2500 epochs total
Iteration 0, loss = 0.0185
Iteration 20, loss = 0.0033
Iteration 40, loss = 0.0354
Iteration 60, loss = 0.0471
Iteration 80, loss = 0.0094
--- Epoch 53 / 100000 - 2501 epochs total
Iteration 0, loss = 0.0082
Iteration 20, loss = 0.0901
Iteration 40, loss = 0.0232
Iteration 60, loss = 0.0036
Iteration 80, loss = 0.0045
--- Epoch 54 / 100000 - 2502 epochs total
Iteration 0, loss = 0.0148
Iteration 20, loss = 0.0068
Iteration 40, loss = 0.0048
Iteration 60, loss = 0.0091
Iteration 80, loss = 0.0088
--- Epoch 55 / 100000 - 2503 epochs total
Iteration 0, loss = 0.0123
Iteration 20, loss = 0.0128
Iteration 40, loss = 0.0077
Iteration 60, loss = 0.0045
Iteration 80, loss = 0.0186
--- Epoch 56 / 100000 - 2504 epochs total
Iteration 0, loss = 0.0333
Iteration 20, loss = 0.0029
Iteration 40, loss = 0.0191
Iteration 60, loss = 0.0057
Iteration 80, loss = 0.0087
--- Epoch 57 / 100000 - 2505 epochs total
Iteration 0, loss = 0.0469
Iteration 20, loss = 0.0514
Iteration 40, loss = 0.0080
Iteration 60, loss = 0.0035
Iteration 80, loss = 0.0114
--- Epoch 58 / 100000 - 2506 epochs total
Iteration 0, loss = 0.0097
Iteration 20, loss = 0.0096
Iteration 40, loss = 0.0184
Iteration 60, loss = 0.0047
Iteration 80, loss = 0.0106
--- Epoch 59 / 100000 - 2507 epochs total
Iteration 0, loss = 0.0033
Iteration 20, loss = 0.0821
Iteration 40, loss = 0.0103
Iteration 60, loss = 0.0055
Iteration 80, loss = 0.0029
--- Epoch 60 / 100000 - 2508 epochs total
Iteration 0, loss = 0.0290
Iteration 20, loss = 0.0019
Iteration 40, loss = 0.0058
Iteration 60, loss = 0.0052
Iteration 80, loss = 0.0018
--- Epoch 61 / 100000 - 2509 epochs total
Iteration 0, loss = 0.0147
Iteration 20, loss = 0.0066
Iteration 40, loss = 0.0119
Iteration 60, loss = 0.0378
Iteration 80, loss = 0.0080
--- Epoch 62 / 100000 - 2510 epochs total
Iteration 0, loss = 0.0028
Iteration 20, loss = 0.0657
Iteration 40, loss = 0.0023
Iteration 60, loss = 0.0098
Iteration 80, loss = 0.0156
--- Epoch 63 / 100000 - 2511 epochs total
Iteration 0, loss = 0.0102
Iteration 20, loss = 0.0120
Iteration 40, loss = 0.0026
Iteration 60, loss = 0.0035
Iteration 80, loss = 0.0045
--- Epoch 64 / 100000 - 2512 epochs total
Iteration 0, loss = 0.0052
Iteration 20, loss = 0.0067
Iteration 40, loss = 0.0237
Iteration 60, loss = 0.0022
Iteration 80, loss = 0.0165
--- Epoch 65 / 100000 - 2513 epochs total
Iteration 0, loss = 0.0019
Iteration 20, loss = 0.0102
Iteration 40, loss = 0.0185
Iteration 60, loss = 0.0021
Iteration 80, loss = 0.0038
--- Epoch 66 / 100000 - 2514 epochs total
Iteration 0, loss = 0.0086
Iteration 20, loss = 0.0026
Iteration 40, loss = 0.0181
Iteration 60, loss = 0.0149
Iteration 80, loss = 0.0041
--- Epoch 67 / 100000 - 2515 epochs total
Iteration 0, loss = 0.0057
Iteration 20, loss = 0.0067
Iteration 40, loss = 0.0040
Iteration 60, loss = 0.0057
Iteration 80, loss = 0.0023
--- Epoch 68 / 100000 - 2516 epochs total
Iteration 0, loss = 0.0174
Iteration 20, loss = 0.0139
Iteration 40, loss = 0.0045
Iteration 60, loss = 0.0027
Iteration 80, loss = 0.0533
--- Epoch 69 / 100000 - 2517 epochs total
Iteration 0, loss = 0.0107
Iteration 20, loss = 0.0083
Iteration 40, loss = 0.0033
Iteration 60, loss = 0.0046
Iteration 80, loss = 0.0491
--- Epoch 70 / 100000 - 2518 epochs total
Iteration 0, loss = 0.0091
Iteration 20, loss = 0.0015
Iteration 40, loss = 0.0013
Iteration 60, loss = 0.0062
Iteration 80, loss = 0.0379
--- Epoch 71 / 100000 - 2519 epochs total
Iteration 0, loss = 0.0011
Iteration 20, loss = 0.0033
Iteration 40, loss = 0.0396
Iteration 60, loss = 0.0054
Iteration 80, loss = 0.0107
--- Epoch 72 / 100000 - 2520 epochs total
Iteration 0, loss = 0.0333
Iteration 20, loss = 0.0150
Iteration 40, loss = 0.0037
Iteration 60, loss = 0.0024
Iteration 80, loss = 0.0052
--- Epoch 73 / 100000 - 2521 epochs total
Iteration 0, loss = 0.0067
Iteration 20, loss = 0.0026
Iteration 40, loss = 0.0117
Iteration 60, loss = 0.0058
Iteration 80, loss = 0.0050
--- Epoch 74 / 100000 - 2522 epochs total
Iteration 0, loss = 0.0074
Iteration 20, loss = 0.0074
Iteration 40, loss = 0.0033
Iteration 60, loss = 0.0277
Iteration 80, loss = 0.0069
--- Epoch 75 / 100000 - 2523 epochs total
Iteration 0, loss = 0.0102
Iteration 20, loss = 0.0038
Iteration 40, loss = 0.0077
Iteration 60, loss = 0.0094
Iteration 80, loss = 0.0062
--- Epoch 76 / 100000 - 2524 epochs total
Iteration 0, loss = 0.0060
Iteration 20, loss = 0.0021
Iteration 40, loss = 0.0039
Iteration 60, loss = 0.0205
Iteration 80, loss = 0.0122
--- Epoch 77 / 100000 - 2525 epochs total
Iteration 0, loss = 0.0284
Iteration 20, loss = 0.0069
Iteration 40, loss = 0.0053
Iteration 60, loss = 0.0070
Iteration 80, loss = 0.0034
--- Epoch 78 / 100000 - 2526 epochs total
Iteration 0, loss = 0.0037
Iteration 20, loss = 0.0021
Iteration 40, loss = 0.0056
Iteration 60, loss = 0.0333
Iteration 80, loss = 0.0034
--- Epoch 79 / 100000 - 2527 epochs total
Iteration 0, loss = 0.0075
Iteration 20, loss = 0.0051
Iteration 40, loss = 0.0019
Iteration 60, loss = 0.0052
Iteration 80, loss = 0.0071
--- Epoch 80 / 100000 - 2528 epochs total
Iteration 0, loss = 0.0030
Iteration 20, loss = 0.0053
Iteration 40, loss = 0.0095
Iteration 60, loss = 0.0043
Iteration 80, loss = 0.0450
--- Epoch 81 / 100000 - 2529 epochs total
Iteration 0, loss = 0.0129
Iteration 20, loss = 0.0113
Iteration 40, loss = 0.0024
Iteration 60, loss = 0.0065
Iteration 80, loss = 0.0059
--- Epoch 82 / 100000 - 2530 epochs total
Iteration 0, loss = 0.0037
Iteration 20, loss = 0.0027
Iteration 40, loss = 0.0034
Iteration 60, loss = 0.0266
Iteration 80, loss = 0.0061
--- Epoch 83 / 100000 - 2531 epochs total
Iteration 0, loss = 0.0039
Iteration 20, loss = 0.0044
Iteration 40, loss = 0.0077
Iteration 60, loss = 0.0173
Iteration 80, loss = 0.0150
--- Epoch 84 / 100000 - 2532 epochs total
Iteration 0, loss = 0.0147
Iteration 20, loss = 0.0084
Iteration 40, loss = 0.0058
Iteration 60, loss = 0.0055
Iteration 80, loss = 0.0043
--- Epoch 85 / 100000 - 2533 epochs total
Iteration 0, loss = 0.0020
Iteration 20, loss = 0.0120
Iteration 40, loss = 0.0523
Iteration 60, loss = 0.0091
Iteration 80, loss = 0.0030
--- Epoch 86 / 100000 - 2534 epochs total
Iteration 0, loss = 0.0089
Iteration 20, loss = 0.0144
Iteration 40, loss = 0.0357
Iteration 60, loss = 0.0037
Iteration 80, loss = 0.0248
--- Epoch 87 / 100000 - 2535 epochs total
Iteration 0, loss = 0.0093
Iteration 20, loss = 0.0023
Iteration 40, loss = 0.0148
Iteration 60, loss = 0.0101
Iteration 80, loss = 0.0087
--- Epoch 88 / 100000 - 2536 epochs total
Iteration 0, loss = 0.0029
Iteration 20, loss = 0.0058
Iteration 40, loss = 0.0038
Iteration 60, loss = 0.0028
Iteration 80, loss = 0.0040
--- Epoch 89 / 100000 - 2537 epochs total
Iteration 0, loss = 0.0039
Iteration 20, loss = 0.0009
Iteration 40, loss = 0.0059
Iteration 60, loss = 0.0057
Iteration 80, loss = 0.0122
--- Epoch 90 / 100000 - 2538 epochs total
Iteration 0, loss = 0.0023
Iteration 20, loss = 0.0066
Iteration 40, loss = 0.0286
Iteration 60, loss = 0.0124
Iteration 80, loss = 0.0071
--- Epoch 91 / 100000 - 2539 epochs total
Iteration 0, loss = 0.0206
Iteration 20, loss = 0.0072
Iteration 40, loss = 0.0010
Iteration 60, loss = 0.0118
Iteration 80, loss = 0.0039
--- Epoch 92 / 100000 - 2540 epochs total
Iteration 0, loss = 0.0085
Iteration 20, loss = 0.0135
Iteration 40, loss = 0.0118
Iteration 60, loss = 0.0042
Iteration 80, loss = 0.0051
--- Epoch 93 / 100000 - 2541 epochs total
Iteration 0, loss = 0.0062
Iteration 20, loss = 0.0058
Iteration 40, loss = 0.0018
Iteration 60, loss = 0.0028
Iteration 80, loss = 0.0108
--- Epoch 94 / 100000 - 2542 epochs total
Iteration 0, loss = 0.0291
Iteration 20, loss = 0.0064
Iteration 40, loss = 0.0058
Iteration 60, loss = 0.0080
Iteration 80, loss = 0.0165
--- Epoch 95 / 100000 - 2543 epochs total
Iteration 0, loss = 0.0014
Iteration 20, loss = 0.0022
Iteration 40, loss = 0.0238
Iteration 60, loss = 0.0109
Iteration 80, loss = 0.0091
--- Epoch 96 / 100000 - 2544 epochs total
Iteration 0, loss = 0.0094
Iteration 20, loss = 0.0046
Iteration 40, loss = 0.0052
Iteration 60, loss = 0.0271
Iteration 80, loss = 0.0170
--- Epoch 97 / 100000 - 2545 epochs total
Iteration 0, loss = 0.0020
Iteration 20, loss = 0.0109
Iteration 40, loss = 0.0168
Iteration 60, loss = 0.0124
Iteration 80, loss = 0.0127
--- Epoch 98 / 100000 - 2546 epochs total
Iteration 0, loss = 0.0068
Iteration 20, loss = 0.0074
Iteration 40, loss = 0.0042
Iteration 60, loss = 0.0035
Iteration 80, loss = 0.0231
--- Epoch 99 / 100000 - 2547 epochs total
Iteration 0, loss = 0.0027
Iteration 20, loss = 0.0124
Iteration 40, loss = 0.0086
Iteration 60, loss = 0.0345
Iteration 80, loss = 0.0081
--- Epoch 100 / 100000 - 2548 epochs total
Iteration 0, loss = 0.0104
Iteration 20, loss = 0.0147
Iteration 40, loss = 0.0139
Iteration 60, loss = 0.0090
Iteration 80, loss = 0.0200
--- Epoch 101 / 100000 - 2549 epochs total
Iteration 0, loss = 0.0126
Iteration 20, loss = 0.0022
Iteration 40, loss = 0.0013
Iteration 60, loss = 0.0228
Iteration 80, loss = 0.0025
--- Epoch 102 / 100000 - 2550 epochs total
Iteration 0, loss = 0.0025
Iteration 20, loss = 0.0034
Iteration 40, loss = 0.0091
Iteration 60, loss = 0.0024
Iteration 80, loss = 0.0049
--- Epoch 103 / 100000 - 2551 epochs total
Iteration 0, loss = 0.0551
Iteration 20, loss = 0.0126
Iteration 40, loss = 0.0089
Iteration 60, loss = 0.0021
Iteration 80, loss = 0.0013
--- Epoch 104 / 100000 - 2552 epochs total
Iteration 0, loss = 0.0059
Iteration 20, loss = 0.0013
Iteration 40, loss = 0.0024
Iteration 60, loss = 0.0227
Iteration 80, loss = 0.0034
--- Epoch 105 / 100000 - 2553 epochs total
Iteration 0, loss = 0.0280
Iteration 20, loss = 0.0110
Iteration 40, loss = 0.0073
Iteration 60, loss = 0.0019
Iteration 80, loss = 0.0038
--- Epoch 106 / 100000 - 2554 epochs total
Iteration 0, loss = 0.0084
Iteration 20, loss = 0.0034
Iteration 40, loss = 0.0070
Iteration 60, loss = 0.0095
Iteration 80, loss = 0.0026
--- Epoch 107 / 100000 - 2555 epochs total
Iteration 0, loss = 0.0046
Iteration 20, loss = 0.0336
Iteration 40, loss = 0.0138
Iteration 60, loss = 0.0094
Iteration 80, loss = 0.0066
--- Epoch 108 / 100000 - 2556 epochs total
Iteration 0, loss = 0.0235
Iteration 20, loss = 0.0089
Iteration 40, loss = 0.0149
Iteration 60, loss = 0.0074
Iteration 80, loss = 0.0079
--- Epoch 109 / 100000 - 2557 epochs total
Iteration 0, loss = 0.0010
Iteration 20, loss = 0.0024
Iteration 40, loss = 0.0107
Iteration 60, loss = 0.0068
Iteration 80, loss = 0.0020
--- Epoch 110 / 100000 - 2558 epochs total
Iteration 0, loss = 0.0072
Iteration 20, loss = 0.0120
Iteration 40, loss = 0.0197
Iteration 60, loss = 0.0096
Iteration 80, loss = 0.0103
--- Epoch 111 / 100000 - 2559 epochs total
Iteration 0, loss = 0.0103
Iteration 20, loss = 0.0125
Iteration 40, loss = 0.0050
Iteration 60, loss = 0.0073
Iteration 80, loss = 0.0077
--- Epoch 112 / 100000 - 2560 epochs total
Iteration 0, loss = 0.0054
Iteration 20, loss = 0.0059
Iteration 40, loss = 0.0108
Iteration 60, loss = 0.0085
Iteration 80, loss = 0.0104
--- Epoch 113 / 100000 - 2561 epochs total
Iteration 0, loss = 0.0012
Iteration 20, loss = 0.0070
Iteration 40, loss = 0.0023
Iteration 60, loss = 0.0259
Iteration 80, loss = 0.0112
--- Epoch 114 / 100000 - 2562 epochs total
Iteration 0, loss = 0.0026
Iteration 20, loss = 0.0050
Iteration 40, loss = 0.0135
Iteration 60, loss = 0.0057
Iteration 80, loss = 0.0110
--- Epoch 115 / 100000 - 2563 epochs total
Iteration 0, loss = 0.0074
Iteration 20, loss = 0.0022
Iteration 40, loss = 0.0115
Iteration 60, loss = 0.0041
Iteration 80, loss = 0.0029
--- Epoch 116 / 100000 - 2564 epochs total
Iteration 0, loss = 0.0044
Iteration 20, loss = 0.0080
Iteration 40, loss = 0.0010
Iteration 60, loss = 0.0024
Iteration 80, loss = 0.0114
--- Epoch 117 / 100000 - 2565 epochs total
Iteration 0, loss = 0.0076
Iteration 20, loss = 0.0159
Iteration 40, loss = 0.0067
Iteration 60, loss = 0.0052
Iteration 80, loss = 0.0008
--- Epoch 118 / 100000 - 2566 epochs total
Iteration 0, loss = 0.0023
Iteration 20, loss = 0.0033
Iteration 40, loss = 0.0038
Iteration 60, loss = 0.0084
Iteration 80, loss = 0.0147
--- Epoch 119 / 100000 - 2567 epochs total
Iteration 0, loss = 0.0124
Iteration 20, loss = 0.0259
Iteration 40, loss = 0.0050
Iteration 60, loss = 0.0127
Iteration 80, loss = 0.0035
--- Epoch 120 / 100000 - 2568 epochs total
Iteration 0, loss = 0.0125
Iteration 20, loss = 0.0304
Iteration 40, loss = 0.0052
Iteration 60, loss = 0.0155
Iteration 80, loss = 0.0150
--- Epoch 121 / 100000 - 2569 epochs total
Iteration 0, loss = 0.0052
Iteration 20, loss = 0.0029
Iteration 40, loss = 0.0022
Iteration 60, loss = 0.0057
Iteration 80, loss = 0.0140
--- Epoch 122 / 100000 - 2570 epochs total
Iteration 0, loss = 0.0047
Iteration 20, loss = 0.0451
Iteration 40, loss = 0.0242
Iteration 60, loss = 0.0014
Iteration 80, loss = 0.0050
--- Epoch 123 / 100000 - 2571 epochs total
Iteration 0, loss = 0.0079
Iteration 20, loss = 0.0040
Iteration 40, loss = 0.0024
Iteration 60, loss = 0.0404
Iteration 80, loss = 0.0134
--- Epoch 124 / 100000 - 2572 epochs total
Iteration 0, loss = 0.0114
Iteration 20, loss = 0.0158
Iteration 40, loss = 0.0029
Iteration 60, loss = 0.0098
Iteration 80, loss = 0.0049
--- Epoch 125 / 100000 - 2573 epochs total
Iteration 0, loss = 0.0368
Iteration 20, loss = 0.0041
Iteration 40, loss = 0.0026
Iteration 60, loss = 0.0142
Iteration 80, loss = 0.0121
--- Epoch 126 / 100000 - 2574 epochs total
Iteration 0, loss = 0.0044
Iteration 20, loss = 0.0125
Iteration 40, loss = 0.0083
Iteration 60, loss = 0.0063
Iteration 80, loss = 0.0070
--- Epoch 127 / 100000 - 2575 epochs total
Iteration 0, loss = 0.0037
Iteration 20, loss = 0.0305
Iteration 40, loss = 0.0040
Iteration 60, loss = 0.0311
Iteration 80, loss = 0.0091
--- Epoch 128 / 100000 - 2576 epochs total
Iteration 0, loss = 0.0099
Iteration 20, loss = 0.0350
Iteration 40, loss = 0.0114
Iteration 60, loss = 0.0043
Iteration 80, loss = 0.0156
--- Epoch 129 / 100000 - 2577 epochs total
Iteration 0, loss = 0.0015
Iteration 20, loss = 0.0180
Iteration 40, loss = 0.0068
Iteration 60, loss = 0.0007
Iteration 80, loss = 0.0040
--- Epoch 130 / 100000 - 2578 epochs total
Iteration 0, loss = 0.0112
Iteration 20, loss = 0.0304
Iteration 40, loss = 0.0119
Iteration 60, loss = 0.0068
Iteration 80, loss = 0.0099
--- Epoch 131 / 100000 - 2579 epochs total
Iteration 0, loss = 0.0191
Iteration 20, loss = 0.0172
Iteration 40, loss = 0.0193
Iteration 60, loss = 0.0026
Iteration 80, loss = 0.0138
--- Epoch 132 / 100000 - 2580 epochs total
Iteration 0, loss = 0.0413
Iteration 20, loss = 0.0120
Iteration 40, loss = 0.0067
Iteration 60, loss = 0.0071
Iteration 80, loss = 0.0062
--- Epoch 133 / 100000 - 2581 epochs total
Iteration 0, loss = 0.0084
Iteration 20, loss = 0.0046
Iteration 40, loss = 0.0080
Iteration 60, loss = 0.0085
Iteration 80, loss = 0.0043
--- Epoch 134 / 100000 - 2582 epochs total
Iteration 0, loss = 0.0041
Iteration 20, loss = 0.0118
Iteration 40, loss = 0.0116
Iteration 60, loss = 0.0071
Iteration 80, loss = 0.0033
--- Epoch 135 / 100000 - 2583 epochs total
Iteration 0, loss = 0.0092
Iteration 20, loss = 0.0023
Iteration 40, loss = 0.0076
Iteration 60, loss = 0.0075
Iteration 80, loss = 0.0089
--- Epoch 136 / 100000 - 2584 epochs total
Iteration 0, loss = 0.0141
Iteration 20, loss = 0.0158
Iteration 40, loss = 0.0041
Iteration 60, loss = 0.0051
Iteration 80, loss = 0.0045
--- Epoch 137 / 100000 - 2585 epochs total
Iteration 0, loss = 0.0039
Iteration 20, loss = 0.0018
Iteration 40, loss = 0.0038
Iteration 60, loss = 0.0029
Iteration 80, loss = 0.0191
--- Epoch 138 / 100000 - 2586 epochs total
Iteration 0, loss = 0.0043
Iteration 20, loss = 0.0098
Iteration 40, loss = 0.0025
Iteration 60, loss = 0.0042
Iteration 80, loss = 0.0126
--- Epoch 139 / 100000 - 2587 epochs total
Iteration 0, loss = 0.0240
Iteration 20, loss = 0.0053
Iteration 40, loss = 0.0126
Iteration 60, loss = 0.0080
Iteration 80, loss = 0.0046
--- Epoch 140 / 100000 - 2588 epochs total
Iteration 0, loss = 0.0033
Iteration 20, loss = 0.0051
Iteration 40, loss = 0.0091
Iteration 60, loss = 0.0036
Iteration 80, loss = 0.0111
--- Epoch 141 / 100000 - 2589 epochs total
Iteration 0, loss = 0.0088
Iteration 20, loss = 0.0035
Iteration 40, loss = 0.0599
Iteration 60, loss = 0.0014
Iteration 80, loss = 0.0042
--- Epoch 142 / 100000 - 2590 epochs total
Iteration 0, loss = 0.0088
Iteration 20, loss = 0.0215
Iteration 40, loss = 0.0090
Iteration 60, loss = 0.0034
Iteration 80, loss = 0.0127
--- Epoch 143 / 100000 - 2591 epochs total
Iteration 0, loss = 0.0191
Iteration 20, loss = 0.0043
Iteration 40, loss = 0.0032
Iteration 60, loss = 0.0017
Iteration 80, loss = 0.0011
--- Epoch 144 / 100000 - 2592 epochs total
Iteration 0, loss = 0.0039
Iteration 20, loss = 0.0074
Iteration 40, loss = 0.0022
Iteration 60, loss = 0.0063
Iteration 80, loss = 0.0031
--- Epoch 145 / 100000 - 2593 epochs total
Iteration 0, loss = 0.0086
Iteration 20, loss = 0.0105
Iteration 40, loss = 0.0082
Iteration 60, loss = 0.0166
Iteration 80, loss = 0.0050
--- Epoch 146 / 100000 - 2594 epochs total
Iteration 0, loss = 0.0246
Iteration 20, loss = 0.0046
Iteration 40, loss = 0.0152
Iteration 60, loss = 0.0045
Iteration 80, loss = 0.0026
--- Epoch 147 / 100000 - 2595 epochs total
Iteration 0, loss = 0.0312
Iteration 20, loss = 0.0207
Iteration 40, loss = 0.0206
Iteration 60, loss = 0.0185
Iteration 80, loss = 0.0488
--- Epoch 148 / 100000 - 2596 epochs total
Iteration 0, loss = 0.0071
Iteration 20, loss = 0.0988
Iteration 40, loss = 0.0060
Iteration 60, loss = 0.0150
Iteration 80, loss = 0.0103
--- Epoch 149 / 100000 - 2597 epochs total
Iteration 0, loss = 0.0154
Iteration 20, loss = 0.0072
Iteration 40, loss = 0.0087
Iteration 60, loss = 0.0026
Iteration 80, loss = 0.0030
--- Epoch 150 / 100000 - 2598 epochs total
Iteration 0, loss = 0.0026
Iteration 20, loss = 0.0049
Iteration 40, loss = 0.0419
Iteration 60, loss = 0.0039
Iteration 80, loss = 0.0169
--- Epoch 151 / 100000 - 2599 epochs total
Iteration 0, loss = 0.0026
Iteration 20, loss = 0.0013
Iteration 40, loss = 0.0146
Iteration 60, loss = 0.0183
Iteration 80, loss = 0.0034
--- Epoch 152 / 100000 - 2600 epochs total
Iteration 0, loss = 0.0074
Iteration 20, loss = 0.0070
Iteration 40, loss = 0.0051
Iteration 60, loss = 0.0056
Iteration 80, loss = 0.0060
--- Epoch 153 / 100000 - 2601 epochs total
Iteration 0, loss = 0.0028
Iteration 20, loss = 0.0060
Iteration 40, loss = 0.0162
Iteration 60, loss = 0.0110
Iteration 80, loss = 0.0062
--- Epoch 154 / 100000 - 2602 epochs total
Iteration 0, loss = 0.0071
Iteration 20, loss = 0.0231
Iteration 40, loss = 0.0047
Iteration 60, loss = 0.0421
Iteration 80, loss = 0.0150
--- Epoch 155 / 100000 - 2603 epochs total
Iteration 0, loss = 0.0079
Iteration 20, loss = 0.0068
Iteration 40, loss = 0.0027
Iteration 60, loss = 0.0104
Iteration 80, loss = 0.0038
--- Epoch 156 / 100000 - 2604 epochs total
Iteration 0, loss = 0.0059
Iteration 20, loss = 0.0052
Iteration 40, loss = 0.0029
Iteration 60, loss = 0.0379
Iteration 80, loss = 0.0042
--- Epoch 157 / 100000 - 2605 epochs total
Iteration 0, loss = 0.0061
Iteration 20, loss = 0.0050
Iteration 40, loss = 0.0041
Iteration 60, loss = 0.0069
Iteration 80, loss = 0.0132
--- Epoch 158 / 100000 - 2606 epochs total
Iteration 0, loss = 0.0114
Iteration 20, loss = 0.0169
Iteration 40, loss = 0.0065
Iteration 60, loss = 0.0021
Iteration 80, loss = 0.0022
--- Epoch 159 / 100000 - 2607 epochs total
Iteration 0, loss = 0.0321
Iteration 20, loss = 0.0136
Iteration 40, loss = 0.0045
Iteration 60, loss = 0.0224
Iteration 80, loss = 0.0124
--- Epoch 160 / 100000 - 2608 epochs total
Iteration 0, loss = 0.0030
Iteration 20, loss = 0.0048
Iteration 40, loss = 0.0309
Iteration 60, loss = 0.0282
Iteration 80, loss = 0.0080
--- Epoch 161 / 100000 - 2609 epochs total
Iteration 0, loss = 0.0054
Iteration 20, loss = 0.0152
Iteration 40, loss = 0.0067
Iteration 60, loss = 0.0090
Iteration 80, loss = 0.0031
--- Epoch 162 / 100000 - 2610 epochs total
Iteration 0, loss = 0.0054
Iteration 20, loss = 0.0034
Iteration 40, loss = 0.0046
Iteration 60, loss = 0.0022
Iteration 80, loss = 0.0087
--- Epoch 163 / 100000 - 2611 epochs total
Iteration 0, loss = 0.0040
Iteration 20, loss = 0.0060
Iteration 40, loss = 0.0329
Iteration 60, loss = 0.0073
Iteration 80, loss = 0.0044
--- Epoch 164 / 100000 - 2612 epochs total
Iteration 0, loss = 0.0053
Iteration 20, loss = 0.0026
Iteration 40, loss = 0.0233
Iteration 60, loss = 0.0124
Iteration 80, loss = 0.0313
--- Epoch 165 / 100000 - 2613 epochs total
Iteration 0, loss = 0.0309
Iteration 20, loss = 0.0140
Iteration 40, loss = 0.0075
Iteration 60, loss = 0.0069
Iteration 80, loss = 0.0099
--- Epoch 166 / 100000 - 2614 epochs total
Iteration 0, loss = 0.0363
Iteration 20, loss = 0.0122
Iteration 40, loss = 0.0155
Iteration 60, loss = 0.0044
Iteration 80, loss = 0.0023
--- Epoch 167 / 100000 - 2615 epochs total
Iteration 0, loss = 0.0149
Iteration 20, loss = 0.0052
Iteration 40, loss = 0.0116
Iteration 60, loss = 0.0040
Iteration 80, loss = 0.0056
--- Epoch 168 / 100000 - 2616 epochs total
Iteration 0, loss = 0.0224
Iteration 20, loss = 0.0059
Iteration 40, loss = 0.0141
Iteration 60, loss = 0.0299
Iteration 80, loss = 0.0073
--- Epoch 169 / 100000 - 2617 epochs total
Iteration 0, loss = 0.0016
Iteration 20, loss = 0.0365
Iteration 40, loss = 0.0034
Iteration 60, loss = 0.0136
Iteration 80, loss = 0.0124
--- Epoch 170 / 100000 - 2618 epochs total
Iteration 0, loss = 0.0022
Iteration 20, loss = 0.0051
Iteration 40, loss = 0.0077
Iteration 60, loss = 0.0093
Iteration 80, loss = 0.0009
--- Epoch 171 / 100000 - 2619 epochs total
Iteration 0, loss = 0.0025
Iteration 20, loss = 0.0175
Iteration 40, loss = 0.0057
Iteration 60, loss = 0.0061
Iteration 80, loss = 0.0009
--- Epoch 172 / 100000 - 2620 epochs total
Iteration 0, loss = 0.0048
Iteration 20, loss = 0.0021
Iteration 40, loss = 0.0032
Iteration 60, loss = 0.0022
Iteration 80, loss = 0.0050
--- Epoch 173 / 100000 - 2621 epochs total
Iteration 0, loss = 0.0068
Iteration 20, loss = 0.0058
Iteration 40, loss = 0.0028
Iteration 60, loss = 0.0210
Iteration 80, loss = 0.0061
--- Epoch 174 / 100000 - 2622 epochs total
Iteration 0, loss = 0.0070
Iteration 20, loss = 0.0183
Iteration 40, loss = 0.0128
Iteration 60, loss = 0.0029
Iteration 80, loss = 0.0039
--- Epoch 175 / 100000 - 2623 epochs total
Iteration 0, loss = 0.0300
Iteration 20, loss = 0.0066
Iteration 40, loss = 0.0060
Iteration 60, loss = 0.0076
Iteration 80, loss = 0.0041
--- Epoch 176 / 100000 - 2624 epochs total
Iteration 0, loss = 0.0019
Iteration 20, loss = 0.0348
Iteration 40, loss = 0.0067
Iteration 60, loss = 0.0018
Iteration 80, loss = 0.0083
--- Epoch 177 / 100000 - 2625 epochs total
Iteration 0, loss = 0.0045
Iteration 20, loss = 0.0027
Iteration 40, loss = 0.0033
Iteration 60, loss = 0.0038
Iteration 80, loss = 0.0034
--- Epoch 178 / 100000 - 2626 epochs total
Iteration 0, loss = 0.0085
Iteration 20, loss = 0.0143
Iteration 40, loss = 0.0036
Iteration 60, loss = 0.0043
Iteration 80, loss = 0.0035
--- Epoch 179 / 100000 - 2627 epochs total
Iteration 0, loss = 0.0081
Iteration 20, loss = 0.0367
Iteration 40, loss = 0.0023
Iteration 60, loss = 0.0043
Iteration 80, loss = 0.0092
--- Epoch 180 / 100000 - 2628 epochs total
Iteration 0, loss = 0.0142
Iteration 20, loss = 0.0050
Iteration 40, loss = 0.0032
Iteration 60, loss = 0.0081
Iteration 80, loss = 0.0062
--- Epoch 181 / 100000 - 2629 epochs total
Iteration 0, loss = 0.0061
Iteration 20, loss = 0.0102
Iteration 40, loss = 0.0482
Iteration 60, loss = 0.0077
Iteration 80, loss = 0.0096
--- Epoch 182 / 100000 - 2630 epochs total
Iteration 0, loss = 0.0122
Iteration 20, loss = 0.0044
Iteration 40, loss = 0.0033
Iteration 60, loss = 0.0017
Iteration 80, loss = 0.0038
--- Epoch 183 / 100000 - 2631 epochs total
Iteration 0, loss = 0.0040
Iteration 20, loss = 0.0049
Iteration 40, loss = 0.0036
Iteration 60, loss = 0.0196
Iteration 80, loss = 0.0019
--- Epoch 184 / 100000 - 2632 epochs total
Iteration 0, loss = 0.0034
Iteration 20, loss = 0.0125
Iteration 40, loss = 0.0034
Iteration 60, loss = 0.0063
Iteration 80, loss = 0.0043
--- Epoch 185 / 100000 - 2633 epochs total
Iteration 0, loss = 0.0057
Iteration 20, loss = 0.0072
Iteration 40, loss = 0.0052
Iteration 60, loss = 0.0020
Iteration 80, loss = 0.0123
--- Epoch 186 / 100000 - 2634 epochs total
Iteration 0, loss = 0.0289
Iteration 20, loss = 0.0132
Iteration 40, loss = 0.0030
Iteration 60, loss = 0.0059
Iteration 80, loss = 0.0052
--- Epoch 187 / 100000 - 2635 epochs total
Iteration 0, loss = 0.0025
Iteration 20, loss = 0.0045
Iteration 40, loss = 0.0041
Iteration 60, loss = 0.0101
Iteration 80, loss = 0.0060
--- Epoch 188 / 100000 - 2636 epochs total
Iteration 0, loss = 0.0121
Iteration 20, loss = 0.0077
Iteration 40, loss = 0.0070
Iteration 60, loss = 0.0013
Iteration 80, loss = 0.0047
--- Epoch 189 / 100000 - 2637 epochs total
Iteration 0, loss = 0.0063
Iteration 20, loss = 0.0016
Iteration 40, loss = 0.0052
Iteration 60, loss = 0.0022
Iteration 80, loss = 0.0196
--- Epoch 190 / 100000 - 2638 epochs total
Iteration 0, loss = 0.0017
Iteration 20, loss = 0.0279
Iteration 40, loss = 0.0068
Iteration 60, loss = 0.0041
Iteration 80, loss = 0.0037
--- Epoch 191 / 100000 - 2639 epochs total
Iteration 0, loss = 0.0024
Iteration 20, loss = 0.0423
Iteration 40, loss = 0.0209
Iteration 60, loss = 0.0097
Iteration 80, loss = 0.1049
--- Epoch 192 / 100000 - 2640 epochs total
Iteration 0, loss = 0.0024
Iteration 20, loss = 0.0025
Iteration 40, loss = 0.0185
Iteration 60, loss = 0.0030
Iteration 80, loss = 0.0057
--- Epoch 193 / 100000 - 2641 epochs total
Iteration 0, loss = 0.0079
Iteration 20, loss = 0.0201
Iteration 40, loss = 0.0114
Iteration 60, loss = 0.0145
Iteration 80, loss = 0.0033
--- Epoch 194 / 100000 - 2642 epochs total
Iteration 0, loss = 0.0044
Iteration 20, loss = 0.0142
Iteration 40, loss = 0.0011
Iteration 60, loss = 0.0042
Iteration 80, loss = 0.0084
--- Epoch 195 / 100000 - 2643 epochs total
Iteration 0, loss = 0.0059
Iteration 20, loss = 0.0030
Iteration 40, loss = 0.0324
Iteration 60, loss = 0.0043
Iteration 80, loss = 0.0220
--- Epoch 196 / 100000 - 2644 epochs total
Iteration 0, loss = 0.0061
Iteration 20, loss = 0.0019
Iteration 40, loss = 0.0106
Iteration 60, loss = 0.0169
Iteration 80, loss = 0.0174
--- Epoch 197 / 100000 - 2645 epochs total
Iteration 0, loss = 0.0014
Iteration 20, loss = 0.0025
Iteration 40, loss = 0.0165
Iteration 60, loss = 0.0143
Iteration 80, loss = 0.0146
--- Epoch 198 / 100000 - 2646 epochs total
Iteration 0, loss = 0.0023
Iteration 20, loss = 0.0009
Iteration 40, loss = 0.0030
Iteration 60, loss = 0.0123
Iteration 80, loss = 0.0037
--- Epoch 199 / 100000 - 2647 epochs total
Iteration 0, loss = 0.0071
Iteration 20, loss = 0.0185
Iteration 40, loss = 0.0127
Iteration 60, loss = 0.0034
Iteration 80, loss = 0.0021
--- Epoch 200 / 100000 - 2648 epochs total
Iteration 0, loss = 0.0147
Iteration 20, loss = 0.0045
Iteration 40, loss = 0.0042
Iteration 60, loss = 0.0104
Iteration 80, loss = 0.0191
--- Epoch 201 / 100000 - 2649 epochs total
Iteration 0, loss = 0.0074
Iteration 20, loss = 0.0073
Iteration 40, loss = 0.0054
Iteration 60, loss = 0.0033
Iteration 80, loss = 0.0157
--- Epoch 202 / 100000 - 2650 epochs total
Iteration 0, loss = 0.0018
Iteration 20, loss = 0.0117
Iteration 40, loss = 0.0250
Iteration 60, loss = 0.0270
Iteration 80, loss = 0.0079
--- Epoch 203 / 100000 - 2651 epochs total
Iteration 0, loss = 0.0422
Iteration 20, loss = 0.0079
Iteration 40, loss = 0.0088
Iteration 60, loss = 0.0023
Iteration 80, loss = 0.0188
--- Epoch 204 / 100000 - 2652 epochs total
Iteration 0, loss = 0.0251
Iteration 20, loss = 0.0080
Iteration 40, loss = 0.0036
Iteration 60, loss = 0.0181
Iteration 80, loss = 0.0147
--- Epoch 205 / 100000 - 2653 epochs total
Iteration 0, loss = 0.0438
Iteration 20, loss = 0.0027
Iteration 40, loss = 0.0023
Iteration 60, loss = 0.0058
Iteration 80, loss = 0.0122
--- Epoch 206 / 100000 - 2654 epochs total
Iteration 0, loss = 0.0038
Iteration 20, loss = 0.0095
Iteration 40, loss = 0.0672
Iteration 60, loss = 0.0146
Iteration 80, loss = 0.0047
--- Epoch 207 / 100000 - 2655 epochs total
Iteration 0, loss = 0.0101
Iteration 20, loss = 0.0507
Iteration 40, loss = 0.0056
Iteration 60, loss = 0.0075
Iteration 80, loss = 0.0037
--- Epoch 208 / 100000 - 2656 epochs total
Iteration 0, loss = 0.0034
Iteration 20, loss = 0.0054
Iteration 40, loss = 0.0060
Iteration 60, loss = 0.0136
Iteration 80, loss = 0.0029
--- Epoch 209 / 100000 - 2657 epochs total
Iteration 0, loss = 0.0027
Iteration 20, loss = 0.0110
Iteration 40, loss = 0.0149
Iteration 60, loss = 0.0067
Iteration 80, loss = 0.0039
--- Epoch 210 / 100000 - 2658 epochs total
Iteration 0, loss = 0.0036
Iteration 20, loss = 0.0060
Iteration 40, loss = 0.0050
Iteration 60, loss = 0.0096
Iteration 80, loss = 0.0058
--- Epoch 211 / 100000 - 2659 epochs total
Iteration 0, loss = 0.0029
Iteration 20, loss = 0.0181
Iteration 40, loss = 0.0124
Iteration 60, loss = 0.0016
Iteration 80, loss = 0.0688
--- Epoch 212 / 100000 - 2660 epochs total
Iteration 0, loss = 0.0073
Iteration 20, loss = 0.0088
Iteration 40, loss = 0.0180
Iteration 60, loss = 0.0139
Iteration 80, loss = 0.0206
--- Epoch 213 / 100000 - 2661 epochs total
Iteration 0, loss = 0.0346
Iteration 20, loss = 0.0021
Iteration 40, loss = 0.0037
Iteration 60, loss = 0.0114
Iteration 80, loss = 0.0211
--- Epoch 214 / 100000 - 2662 epochs total
Iteration 0, loss = 0.0155
Iteration 20, loss = 0.0299
Iteration 40, loss = 0.0033
Iteration 60, loss = 0.0096
Iteration 80, loss = 0.0107
--- Epoch 215 / 100000 - 2663 epochs total
Iteration 0, loss = 0.0046
Iteration 20, loss = 0.0030
Iteration 40, loss = 0.0243
Iteration 60, loss = 0.0075
Iteration 80, loss = 0.0016
--- Epoch 216 / 100000 - 2664 epochs total
Iteration 0, loss = 0.0110
Iteration 20, loss = 0.0201
Iteration 40, loss = 0.0098
Iteration 60, loss = 0.0071
Iteration 80, loss = 0.0179
--- Epoch 217 / 100000 - 2665 epochs total
Iteration 0, loss = 0.0053
Iteration 20, loss = 0.0037
Iteration 40, loss = 0.0210
Iteration 60, loss = 0.0071
Iteration 80, loss = 0.0035
--- Epoch 218 / 100000 - 2666 epochs total
Iteration 0, loss = 0.0169
Iteration 20, loss = 0.0126
Iteration 40, loss = 0.0022
Iteration 60, loss = 0.0016
Iteration 80, loss = 0.0118
--- Epoch 219 / 100000 - 2667 epochs total
Iteration 0, loss = 0.0015
Iteration 20, loss = 0.0136
Iteration 40, loss = 0.0039
Iteration 60, loss = 0.0068
Iteration 80, loss = 0.0019
--- Epoch 220 / 100000 - 2668 epochs total
Iteration 0, loss = 0.0038
Iteration 20, loss = 0.0880
Iteration 40, loss = 0.0090
Iteration 60, loss = 0.0038
Iteration 80, loss = 0.0063
--- Epoch 221 / 100000 - 2669 epochs total
Iteration 0, loss = 0.0369
Iteration 20, loss = 0.0123
Iteration 40, loss = 0.0636
Iteration 60, loss = 0.0036
Iteration 80, loss = 0.0090
--- Epoch 222 / 100000 - 2670 epochs total
Iteration 0, loss = 0.0016
Iteration 20, loss = 0.0158
Iteration 40, loss = 0.0024
Iteration 60, loss = 0.0237
Iteration 80, loss = 0.0056
--- Epoch 223 / 100000 - 2671 epochs total
Iteration 0, loss = 0.0026
Iteration 20, loss = 0.0086
Iteration 40, loss = 0.0036
Iteration 60, loss = 0.0060
Iteration 80, loss = 0.0090
--- Epoch 224 / 100000 - 2672 epochs total
Iteration 0, loss = 0.0074
Iteration 20, loss = 0.0159
Iteration 40, loss = 0.0164
Iteration 60, loss = 0.0053
Iteration 80, loss = 0.0979
--- Epoch 225 / 100000 - 2673 epochs total
Iteration 0, loss = 0.0088
Iteration 20, loss = 0.0019
Iteration 40, loss = 0.0238
Iteration 60, loss = 0.0329
Iteration 80, loss = 0.0119
--- Epoch 226 / 100000 - 2674 epochs total
Iteration 0, loss = 0.0029
Iteration 20, loss = 0.0084
Iteration 40, loss = 0.0083
Iteration 60, loss = 0.0097
Iteration 80, loss = 0.0104
--- Epoch 227 / 100000 - 2675 epochs total
Iteration 0, loss = 0.0050
Iteration 20, loss = 0.0317
Iteration 40, loss = 0.0046
Iteration 60, loss = 0.0254
Iteration 80, loss = 0.0030
--- Epoch 228 / 100000 - 2676 epochs total
Iteration 0, loss = 0.0028
Iteration 20, loss = 0.0054
Iteration 40, loss = 0.0099
Iteration 60, loss = 0.0118
Iteration 80, loss = 0.0119
--- Epoch 229 / 100000 - 2677 epochs total
Iteration 0, loss = 0.0358
Iteration 20, loss = 0.0037
Iteration 40, loss = 0.0057
Iteration 60, loss = 0.0249
Iteration 80, loss = 0.0260
--- Epoch 230 / 100000 - 2678 epochs total
Iteration 0, loss = 0.0333
Iteration 20, loss = 0.0120
Iteration 40, loss = 0.0145
Iteration 60, loss = 0.0066
Iteration 80, loss = 0.0051
--- Epoch 231 / 100000 - 2679 epochs total
Iteration 0, loss = 0.0091
Iteration 20, loss = 0.0153
Iteration 40, loss = 0.0158
Iteration 60, loss = 0.0090
Iteration 80, loss = 0.0017
--- Epoch 232 / 100000 - 2680 epochs total
Iteration 0, loss = 0.0517
Iteration 20, loss = 0.0103
Iteration 40, loss = 0.0180
Iteration 60, loss = 0.0068
Iteration 80, loss = 0.0047
--- Epoch 233 / 100000 - 2681 epochs total
Iteration 0, loss = 0.0085
Iteration 20, loss = 0.0223
Iteration 40, loss = 0.0056
Iteration 60, loss = 0.0077
Iteration 80, loss = 0.0162
--- Epoch 234 / 100000 - 2682 epochs total
Iteration 0, loss = 0.0179
Iteration 20, loss = 0.0045
Iteration 40, loss = 0.0123
Iteration 60, loss = 0.0038
Iteration 80, loss = 0.0206
--- Epoch 235 / 100000 - 2683 epochs total
Iteration 0, loss = 0.0025
Iteration 20, loss = 0.0247
Iteration 40, loss = 0.0144
Iteration 60, loss = 0.0168
Iteration 80, loss = 0.0036
--- Epoch 236 / 100000 - 2684 epochs total
Iteration 0, loss = 0.0143
Iteration 20, loss = 0.0017
Iteration 40, loss = 0.0043
Iteration 60, loss = 0.0125
Iteration 80, loss = 0.0191
--- Epoch 237 / 100000 - 2685 epochs total
Iteration 0, loss = 0.0064
Iteration 20, loss = 0.0031
Iteration 40, loss = 0.0054
Iteration 60, loss = 0.0027
Iteration 80, loss = 0.0090
--- Epoch 238 / 100000 - 2686 epochs total
Iteration 0, loss = 0.0021
Iteration 20, loss = 0.0072
Iteration 40, loss = 0.0137
Iteration 60, loss = 0.0024
Iteration 80, loss = 0.0024
--- Epoch 239 / 100000 - 2687 epochs total
Iteration 0, loss = 0.0076
Iteration 20, loss = 0.0033
Iteration 40, loss = 0.0013
Iteration 60, loss = 0.0097
Iteration 80, loss = 0.0071
--- Epoch 240 / 100000 - 2688 epochs total
Iteration 0, loss = 0.0046
Iteration 20, loss = 0.0131
Iteration 40, loss = 0.0056
Iteration 60, loss = 0.0029
Iteration 80, loss = 0.0081
--- Epoch 241 / 100000 - 2689 epochs total
Iteration 0, loss = 0.0098
Iteration 20, loss = 0.0083
Iteration 40, loss = 0.0058
Iteration 60, loss = 0.0049
Iteration 80, loss = 0.0043
--- Epoch 242 / 100000 - 2690 epochs total
Iteration 0, loss = 0.0153
Iteration 20, loss = 0.0074
Iteration 40, loss = 0.0124
Iteration 60, loss = 0.0234
Iteration 80, loss = 0.0105
--- Epoch 243 / 100000 - 2691 epochs total
Iteration 0, loss = 0.0057
Iteration 20, loss = 0.0120
Iteration 40, loss = 0.0090
Iteration 60, loss = 0.0046
Iteration 80, loss = 0.0052
--- Epoch 244 / 100000 - 2692 epochs total
Iteration 0, loss = 0.0059
Iteration 20, loss = 0.0139
Iteration 40, loss = 0.0041
Iteration 60, loss = 0.0014
Iteration 80, loss = 0.0027
--- Epoch 245 / 100000 - 2693 epochs total
Iteration 0, loss = 0.0035
Iteration 20, loss = 0.0107
Iteration 40, loss = 0.0165
Iteration 60, loss = 0.0060
Iteration 80, loss = 0.0233
--- Epoch 246 / 100000 - 2694 epochs total
Iteration 0, loss = 0.0037
Iteration 20, loss = 0.0052
Iteration 40, loss = 0.0245
Iteration 60, loss = 0.0041
Iteration 80, loss = 0.0224
--- Epoch 247 / 100000 - 2695 epochs total
Iteration 0, loss = 0.0151
Iteration 20, loss = 0.0147
Iteration 40, loss = 0.0955
Iteration 60, loss = 0.0218
Iteration 80, loss = 0.0178
--- Epoch 248 / 100000 - 2696 epochs total
Iteration 0, loss = 0.0084
Iteration 20, loss = 0.0193
Iteration 40, loss = 0.0028
Iteration 60, loss = 0.0162
Iteration 80, loss = 0.0056
--- Epoch 249 / 100000 - 2697 epochs total
Iteration 0, loss = 0.0040
Iteration 20, loss = 0.0125
Iteration 40, loss = 0.0119
Iteration 60, loss = 0.0058
Iteration 80, loss = 0.0080
--- Epoch 250 / 100000 - 2698 epochs total
Iteration 0, loss = 0.0078
Iteration 20, loss = 0.0035
Iteration 40, loss = 0.0110
Iteration 60, loss = 0.0070
Iteration 80, loss = 0.0526
--- Epoch 251 / 100000 - 2699 epochs total
Iteration 0, loss = 0.0036
Iteration 20, loss = 0.0051
Iteration 40, loss = 0.0068
Iteration 60, loss = 0.0069
Iteration 80, loss = 0.0036
--- Epoch 252 / 100000 - 2700 epochs total
Iteration 0, loss = 0.0276
Iteration 20, loss = 0.0053
Iteration 40, loss = 0.0045
Iteration 60, loss = 0.0030
Iteration 80, loss = 0.0032
--- Epoch 253 / 100000 - 2701 epochs total
Iteration 0, loss = 0.0232
Iteration 20, loss = 0.0073
Iteration 40, loss = 0.0043
Iteration 60, loss = 0.0058
Iteration 80, loss = 0.0062
--- Epoch 254 / 100000 - 2702 epochs total
Iteration 0, loss = 0.0087
Iteration 20, loss = 0.0191
Iteration 40, loss = 0.0022
Iteration 60, loss = 0.0051
Iteration 80, loss = 0.0044
--- Epoch 255 / 100000 - 2703 epochs total
Iteration 0, loss = 0.0131
Iteration 20, loss = 0.0033
Iteration 40, loss = 0.0036
Iteration 60, loss = 0.0040
Iteration 80, loss = 0.0036
--- Epoch 256 / 100000 - 2704 epochs total
Iteration 0, loss = 0.0060
Iteration 20, loss = 0.0056
Iteration 40, loss = 0.0030
Iteration 60, loss = 0.0305
Iteration 80, loss = 0.0095
--- Epoch 257 / 100000 - 2705 epochs total
Iteration 0, loss = 0.0074
Iteration 20, loss = 0.0132
Iteration 40, loss = 0.0093
Iteration 60, loss = 0.0070
Iteration 80, loss = 0.0158
--- Epoch 258 / 100000 - 2706 epochs total
Iteration 0, loss = 0.0179
Iteration 20, loss = 0.0039
Iteration 40, loss = 0.0311
Iteration 60, loss = 0.0018
Iteration 80, loss = 0.0134
--- Epoch 259 / 100000 - 2707 epochs total
Iteration 0, loss = 0.0086
Iteration 20, loss = 0.0031
Iteration 40, loss = 0.0127
Iteration 60, loss = 0.0094
Iteration 80, loss = 0.0042
--- Epoch 260 / 100000 - 2708 epochs total
Iteration 0, loss = 0.0080
Iteration 20, loss = 0.0049
Iteration 40, loss = 0.0080
Iteration 60, loss = 0.0085
Iteration 80, loss = 0.0041
--- Epoch 261 / 100000 - 2709 epochs total
Iteration 0, loss = 0.0092
Iteration 20, loss = 0.0070
Iteration 40, loss = 0.0077
Iteration 60, loss = 0.0108
Iteration 80, loss = 0.0081
--- Epoch 262 / 100000 - 2710 epochs total
Iteration 0, loss = 0.0069
Iteration 20, loss = 0.0067
Iteration 40, loss = 0.0100
Iteration 60, loss = 0.0034
Iteration 80, loss = 0.0062
--- Epoch 263 / 100000 - 2711 epochs total
Iteration 0, loss = 0.0113
Iteration 20, loss = 0.0065
Iteration 40, loss = 0.0050
Iteration 60, loss = 0.0150
Iteration 80, loss = 0.0147
--- Epoch 264 / 100000 - 2712 epochs total
Iteration 0, loss = 0.0580
Iteration 20, loss = 0.0084
Iteration 40, loss = 0.0121
Iteration 60, loss = 0.0184
Iteration 80, loss = 0.0272
--- Epoch 265 / 100000 - 2713 epochs total
Iteration 0, loss = 0.0591
Iteration 20, loss = 0.0453
Iteration 40, loss = 0.0065
Iteration 60, loss = 0.0201
Iteration 80, loss = 0.0517
--- Epoch 266 / 100000 - 2714 epochs total
Iteration 0, loss = 0.0177
Iteration 20, loss = 0.0207
Iteration 40, loss = 0.0031
Iteration 60, loss = 0.0030
Iteration 80, loss = 0.0020
--- Epoch 267 / 100000 - 2715 epochs total
Iteration 0, loss = 0.0036
Iteration 20, loss = 0.0048
Iteration 40, loss = 0.0248
Iteration 60, loss = 0.0032
Iteration 80, loss = 0.0129
--- Epoch 268 / 100000 - 2716 epochs total
Iteration 0, loss = 0.0020
Iteration 20, loss = 0.0049
Iteration 40, loss = 0.0096
Iteration 60, loss = 0.0115
Iteration 80, loss = 0.0070
--- Epoch 269 / 100000 - 2717 epochs total
Iteration 0, loss = 0.0051
Iteration 20, loss = 0.0251
Iteration 40, loss = 0.0060
Iteration 60, loss = 0.0114
Iteration 80, loss = 0.0372
--- Epoch 270 / 100000 - 2718 epochs total
Iteration 0, loss = 0.0038
Iteration 20, loss = 0.0034
Iteration 40, loss = 0.0016
Iteration 60, loss = 0.0170
Iteration 80, loss = 0.0291
--- Epoch 271 / 100000 - 2719 epochs total
Iteration 0, loss = 0.0201
Iteration 20, loss = 0.0029
Iteration 40, loss = 0.0122
Iteration 60, loss = 0.0268
Iteration 80, loss = 0.0028
--- Epoch 272 / 100000 - 2720 epochs total
Iteration 0, loss = 0.0219
Iteration 20, loss = 0.0060
Iteration 40, loss = 0.0334
Iteration 60, loss = 0.0075
Iteration 80, loss = 0.0114
--- Epoch 273 / 100000 - 2721 epochs total
Iteration 0, loss = 0.0390
Iteration 20, loss = 0.0054
Iteration 40, loss = 0.0025
Iteration 60, loss = 0.0115
Iteration 80, loss = 0.0174
--- Epoch 274 / 100000 - 2722 epochs total
Iteration 0, loss = 0.0074
Iteration 20, loss = 0.0055
Iteration 40, loss = 0.0056
Iteration 60, loss = 0.0015
Iteration 80, loss = 0.0012
--- Epoch 275 / 100000 - 2723 epochs total
Iteration 0, loss = 0.0190
Iteration 20, loss = 0.0119
Iteration 40, loss = 0.0031
Iteration 60, loss = 0.0055
Iteration 80, loss = 0.0306
--- Epoch 276 / 100000 - 2724 epochs total
Iteration 0, loss = 0.0054
Iteration 20, loss = 0.0083
Iteration 40, loss = 0.0065
Iteration 60, loss = 0.0022
Iteration 80, loss = 0.0038
--- Epoch 277 / 100000 - 2725 epochs total
Iteration 0, loss = 0.0020
Iteration 20, loss = 0.0147
Iteration 40, loss = 0.0140
Iteration 60, loss = 0.0013
Iteration 80, loss = 0.0133
--- Epoch 278 / 100000 - 2726 epochs total
Iteration 0, loss = 0.0108
Iteration 20, loss = 0.0202
Iteration 40, loss = 0.0069
Iteration 60, loss = 0.0016
Iteration 80, loss = 0.0024
--- Epoch 279 / 100000 - 2727 epochs total
Iteration 0, loss = 0.0044
Iteration 20, loss = 0.0266
Iteration 40, loss = 0.0030
Iteration 60, loss = 0.0154
Iteration 80, loss = 0.0042
--- Epoch 280 / 100000 - 2728 epochs total
Iteration 0, loss = 0.0021
Iteration 20, loss = 0.0350
Iteration 40, loss = 0.0022
Iteration 60, loss = 0.0351
Iteration 80, loss = 0.0012
--- Epoch 281 / 100000 - 2729 epochs total
Iteration 0, loss = 0.0029
Iteration 20, loss = 0.0056
Iteration 40, loss = 0.0023
Iteration 60, loss = 0.0022
Iteration 80, loss = 0.0039
--- Epoch 282 / 100000 - 2730 epochs total
Iteration 0, loss = 0.0068
Iteration 20, loss = 0.0034
Iteration 40, loss = 0.0014
Iteration 60, loss = 0.0187
Iteration 80, loss = 0.0075
--- Epoch 283 / 100000 - 2731 epochs total
Iteration 0, loss = 0.0073
Iteration 20, loss = 0.0162
Iteration 40, loss = 0.0090
Iteration 60, loss = 0.0144
Iteration 80, loss = 0.0141
--- Epoch 284 / 100000 - 2732 epochs total
Iteration 0, loss = 0.0036
Iteration 20, loss = 0.0104
Iteration 40, loss = 0.0251
Iteration 60, loss = 0.0047
Iteration 80, loss = 0.0058
--- Epoch 285 / 100000 - 2733 epochs total
Iteration 0, loss = 0.0046
Iteration 20, loss = 0.0042
Iteration 40, loss = 0.0053
Iteration 60, loss = 0.0017
Iteration 80, loss = 0.0034
--- Epoch 286 / 100000 - 2734 epochs total
Iteration 0, loss = 0.0376
Iteration 20, loss = 0.0022
Iteration 40, loss = 0.0143
Iteration 60, loss = 0.0081
Iteration 80, loss = 0.0156
--- Epoch 287 / 100000 - 2735 epochs total
Iteration 0, loss = 0.0028
Iteration 20, loss = 0.0028
Iteration 40, loss = 0.0040
Iteration 60, loss = 0.0117
Iteration 80, loss = 0.0027
--- Epoch 288 / 100000 - 2736 epochs total
Iteration 0, loss = 0.0100
Iteration 20, loss = 0.0047
Iteration 40, loss = 0.0189
Iteration 60, loss = 0.0123
Iteration 80, loss = 0.0057
--- Epoch 289 / 100000 - 2737 epochs total
Iteration 0, loss = 0.0025
Iteration 20, loss = 0.0043
Iteration 40, loss = 0.0039
Iteration 60, loss = 0.0087
Iteration 80, loss = 0.0172
--- Epoch 290 / 100000 - 2738 epochs total
Iteration 0, loss = 0.0015
Iteration 20, loss = 0.0222
Iteration 40, loss = 0.0039
Iteration 60, loss = 0.0234
Iteration 80, loss = 0.0126
--- Epoch 291 / 100000 - 2739 epochs total
Iteration 0, loss = 0.0021
Iteration 20, loss = 0.0109
Iteration 40, loss = 0.0099
Iteration 60, loss = 0.0042
Iteration 80, loss = 0.0099
--- Epoch 292 / 100000 - 2740 epochs total
Iteration 0, loss = 0.0139
Iteration 20, loss = 0.0235
Iteration 40, loss = 0.0124
Iteration 60, loss = 0.0011
Iteration 80, loss = 0.0080
--- Epoch 293 / 100000 - 2741 epochs total
Iteration 0, loss = 0.0038
Iteration 20, loss = 0.0374
Iteration 40, loss = 0.0065
Iteration 60, loss = 0.0106
Iteration 80, loss = 0.0067
--- Epoch 294 / 100000 - 2742 epochs total
Iteration 0, loss = 0.0044
Iteration 20, loss = 0.0110
Iteration 40, loss = 0.0111
Iteration 60, loss = 0.0257
Iteration 80, loss = 0.0092
--- Epoch 295 / 100000 - 2743 epochs total
Iteration 0, loss = 0.0068
Iteration 20, loss = 0.0032
Iteration 40, loss = 0.0110
Iteration 60, loss = 0.0115
Iteration 80, loss = 0.0132
--- Epoch 296 / 100000 - 2744 epochs total
Iteration 0, loss = 0.0178
Iteration 20, loss = 0.0043
Iteration 40, loss = 0.0068
Iteration 60, loss = 0.0016
Iteration 80, loss = 0.0076
--- Epoch 297 / 100000 - 2745 epochs total
Iteration 0, loss = 0.0035
Iteration 20, loss = 0.0051
Iteration 40, loss = 0.0036
Iteration 60, loss = 0.0063
Iteration 80, loss = 0.0144
--- Epoch 298 / 100000 - 2746 epochs total
Iteration 0, loss = 0.0073
Iteration 20, loss = 0.0029
Iteration 40, loss = 0.0050
Iteration 60, loss = 0.0058
Iteration 80, loss = 0.0045
--- Epoch 299 / 100000 - 2747 epochs total
Iteration 0, loss = 0.0130
Iteration 20, loss = 0.0122
Iteration 40, loss = 0.0305
Iteration 60, loss = 0.0097
Iteration 80, loss = 0.0225
--- Epoch 300 / 100000 - 2748 epochs total
Iteration 0, loss = 0.0060
Iteration 20, loss = 0.0038
Iteration 40, loss = 0.0049
Iteration 60, loss = 0.0016
Iteration 80, loss = 0.0116
--- Epoch 301 / 100000 - 2749 epochs total
Iteration 0, loss = 0.0075
Iteration 20, loss = 0.0141
Iteration 40, loss = 0.0052
Iteration 60, loss = 0.0285
Iteration 80, loss = 0.0027
--- Epoch 302 / 100000 - 2750 epochs total
Iteration 0, loss = 0.0019
Iteration 20, loss = 0.0057
Iteration 40, loss = 0.0215
Iteration 60, loss = 0.0046
Iteration 80, loss = 0.0066
--- Epoch 303 / 100000 - 2751 epochs total
Iteration 0, loss = 0.0014
Iteration 20, loss = 0.0058
Iteration 40, loss = 0.0215
Iteration 60, loss = 0.0030
Iteration 80, loss = 0.0036
--- Epoch 304 / 100000 - 2752 epochs total
Iteration 0, loss = 0.0096
Iteration 20, loss = 0.0045
Iteration 40, loss = 0.0025
Iteration 60, loss = 0.0076
Iteration 80, loss = 0.0028
--- Epoch 305 / 100000 - 2753 epochs total
Iteration 0, loss = 0.0012
Iteration 20, loss = 0.0134
Iteration 40, loss = 0.0045
Iteration 60, loss = 0.0084
Iteration 80, loss = 0.0010
--- Epoch 306 / 100000 - 2754 epochs total
Iteration 0, loss = 0.0054
Iteration 20, loss = 0.0042
Iteration 40, loss = 0.0084
Iteration 60, loss = 0.0016
Iteration 80, loss = 0.0014
--- Epoch 307 / 100000 - 2755 epochs total
Iteration 0, loss = 0.0050
Iteration 20, loss = 0.0091
Iteration 40, loss = 0.0136
Iteration 60, loss = 0.0038
Iteration 80, loss = 0.0026
--- Epoch 308 / 100000 - 2756 epochs total
Iteration 0, loss = 0.0369
Iteration 20, loss = 0.0169
Iteration 40, loss = 0.0020
Iteration 60, loss = 0.0174
Iteration 80, loss = 0.0123
--- Epoch 309 / 100000 - 2757 epochs total
Iteration 0, loss = 0.0031
Iteration 20, loss = 0.0054
Iteration 40, loss = 0.0232
Iteration 60, loss = 0.0068
Iteration 80, loss = 0.0151
--- Epoch 310 / 100000 - 2758 epochs total
Iteration 0, loss = 0.0110
Iteration 20, loss = 0.0030
Iteration 40, loss = 0.0106
Iteration 60, loss = 0.0059
Iteration 80, loss = 0.0119
--- Epoch 311 / 100000 - 2759 epochs total
Iteration 0, loss = 0.0054
Iteration 20, loss = 0.0041
Iteration 40, loss = 0.0022
Iteration 60, loss = 0.0157
Iteration 80, loss = 0.0062
--- Epoch 312 / 100000 - 2760 epochs total
Iteration 0, loss = 0.0033
Iteration 20, loss = 0.0439
Iteration 40, loss = 0.0046
Iteration 60, loss = 0.0138
Iteration 80, loss = 0.0211
--- Epoch 313 / 100000 - 2761 epochs total
Iteration 0, loss = 0.0062
Iteration 20, loss = 0.0021
Iteration 40, loss = 0.0009
Iteration 60, loss = 0.0112
Iteration 80, loss = 0.0012
--- Epoch 314 / 100000 - 2762 epochs total
Iteration 0, loss = 0.0131
Iteration 20, loss = 0.0073
Iteration 40, loss = 0.0170
Iteration 60, loss = 0.0177
Iteration 80, loss = 0.0178
--- Epoch 315 / 100000 - 2763 epochs total
Iteration 0, loss = 0.0081
Iteration 20, loss = 0.0086
Iteration 40, loss = 0.0017
Iteration 60, loss = 0.0196
Iteration 80, loss = 0.0088
--- Epoch 316 / 100000 - 2764 epochs total
Iteration 0, loss = 0.0053
Iteration 20, loss = 0.0033
Iteration 40, loss = 0.0138
Iteration 60, loss = 0.0075
Iteration 80, loss = 0.0046
--- Epoch 317 / 100000 - 2765 epochs total
Iteration 0, loss = 0.0073
Iteration 20, loss = 0.0149
Iteration 40, loss = 0.0103
Iteration 60, loss = 0.0045
Iteration 80, loss = 0.0023
--- Epoch 318 / 100000 - 2766 epochs total
Iteration 0, loss = 0.0027
Iteration 20, loss = 0.0065
Iteration 40, loss = 0.0166
Iteration 60, loss = 0.0204
Iteration 80, loss = 0.0100
--- Epoch 319 / 100000 - 2767 epochs total
Iteration 0, loss = 0.0028
Iteration 20, loss = 0.0115
Iteration 40, loss = 0.0167
Iteration 60, loss = 0.0047
Iteration 80, loss = 0.0012
--- Epoch 320 / 100000 - 2768 epochs total
Iteration 0, loss = 0.0061
Iteration 20, loss = 0.0064
Iteration 40, loss = 0.0033
Iteration 60, loss = 0.0118
Iteration 80, loss = 0.0119
--- Epoch 321 / 100000 - 2769 epochs total
Iteration 0, loss = 0.0037
Iteration 20, loss = 0.0131
Iteration 40, loss = 0.0074
Iteration 60, loss = 0.0050
Iteration 80, loss = 0.0040
--- Epoch 322 / 100000 - 2770 epochs total
Iteration 0, loss = 0.0012
Iteration 20, loss = 0.0105
Iteration 40, loss = 0.0024
Iteration 60, loss = 0.0164
Iteration 80, loss = 0.0131
--- Epoch 323 / 100000 - 2771 epochs total
Iteration 0, loss = 0.0243
Iteration 20, loss = 0.0090
Iteration 40, loss = 0.0034
Iteration 60, loss = 0.0013
Iteration 80, loss = 0.0018
--- Epoch 324 / 100000 - 2772 epochs total
Iteration 0, loss = 0.0016
Iteration 20, loss = 0.0061
Iteration 40, loss = 0.0180
Iteration 60, loss = 0.0203
Iteration 80, loss = 0.0300
--- Epoch 325 / 100000 - 2773 epochs total
Iteration 0, loss = 0.0039
Iteration 20, loss = 0.0085
Iteration 40, loss = 0.0202
Iteration 60, loss = 0.0048
Iteration 80, loss = 0.0025
--- Epoch 326 / 100000 - 2774 epochs total
Iteration 0, loss = 0.0023
Iteration 20, loss = 0.0037
Iteration 40, loss = 0.0327
Iteration 60, loss = 0.0142
Iteration 80, loss = 0.0072
--- Epoch 327 / 100000 - 2775 epochs total
Iteration 0, loss = 0.0027
Iteration 20, loss = 0.0232
Iteration 40, loss = 0.0021
Iteration 60, loss = 0.0058
Iteration 80, loss = 0.0037
--- Epoch 328 / 100000 - 2776 epochs total
Iteration 0, loss = 0.0063
Iteration 20, loss = 0.0051
Iteration 40, loss = 0.0127
Iteration 60, loss = 0.0028
Iteration 80, loss = 0.0306
--- Epoch 329 / 100000 - 2777 epochs total
Iteration 0, loss = 0.0107
Iteration 20, loss = 0.0034
Iteration 40, loss = 0.0024
Iteration 60, loss = 0.0136
Iteration 80, loss = 0.0319
--- Epoch 330 / 100000 - 2778 epochs total
Iteration 0, loss = 0.0081
Iteration 20, loss = 0.0083
Iteration 40, loss = 0.0069
Iteration 60, loss = 0.0022
Iteration 80, loss = 0.0093
--- Epoch 331 / 100000 - 2779 epochs total
Iteration 0, loss = 0.0074
Iteration 20, loss = 0.0077
Iteration 40, loss = 0.0037
Iteration 60, loss = 0.0090
Iteration 80, loss = 0.0070
--- Epoch 332 / 100000 - 2780 epochs total
Iteration 0, loss = 0.0155
Iteration 20, loss = 0.0033
Iteration 40, loss = 0.0116
Iteration 60, loss = 0.0046
Iteration 80, loss = 0.0044
--- Epoch 333 / 100000 - 2781 epochs total
Iteration 0, loss = 0.0029
Iteration 20, loss = 0.0177
Iteration 40, loss = 0.0134
Iteration 60, loss = 0.0121
Iteration 80, loss = 0.0037
--- Epoch 334 / 100000 - 2782 epochs total
Iteration 0, loss = 0.0075
Iteration 20, loss = 0.0028
Iteration 40, loss = 0.0046
Iteration 60, loss = 0.0171
Iteration 80, loss = 0.0070
--- Epoch 335 / 100000 - 2783 epochs total
Iteration 0, loss = 0.0056
Iteration 20, loss = 0.0155
Iteration 40, loss = 0.0068
Iteration 60, loss = 0.0068
Iteration 80, loss = 0.0065
--- Epoch 336 / 100000 - 2784 epochs total
Iteration 0, loss = 0.0052
Iteration 20, loss = 0.0047
Iteration 40, loss = 0.0158
Iteration 60, loss = 0.0591
Iteration 80, loss = 0.0057
--- Epoch 337 / 100000 - 2785 epochs total
Iteration 0, loss = 0.0230
Iteration 20, loss = 0.0300
Iteration 40, loss = 0.0059
Iteration 60, loss = 0.0221
Iteration 80, loss = 0.0169
--- Epoch 338 / 100000 - 2786 epochs total
Iteration 0, loss = 0.0142
Iteration 20, loss = 0.0250
Iteration 40, loss = 0.0024
Iteration 60, loss = 0.0036
Iteration 80, loss = 0.0094
--- Epoch 339 / 100000 - 2787 epochs total
Iteration 0, loss = 0.0121
Iteration 20, loss = 0.0239
Iteration 40, loss = 0.0038
Iteration 60, loss = 0.0123
Iteration 80, loss = 0.0107
--- Epoch 340 / 100000 - 2788 epochs total
Iteration 0, loss = 0.0117
Iteration 20, loss = 0.0171
Iteration 40, loss = 0.0040
Iteration 60, loss = 0.0060
Iteration 80, loss = 0.0031
--- Epoch 341 / 100000 - 2789 epochs total
Iteration 0, loss = 0.0034
Iteration 20, loss = 0.0021
Iteration 40, loss = 0.0018
Iteration 60, loss = 0.0100
Iteration 80, loss = 0.0122
--- Epoch 342 / 100000 - 2790 epochs total
Iteration 0, loss = 0.0121
Iteration 20, loss = 0.0061
Iteration 40, loss = 0.0114
Iteration 60, loss = 0.0685
Iteration 80, loss = 0.0092
--- Epoch 343 / 100000 - 2791 epochs total
Iteration 0, loss = 0.0041
Iteration 20, loss = 0.0071
Iteration 40, loss = 0.0235
Iteration 60, loss = 0.0172
Iteration 80, loss = 0.0051
--- Epoch 344 / 100000 - 2792 epochs total
Iteration 0, loss = 0.0079
Iteration 20, loss = 0.0807
Iteration 40, loss = 0.0043
Iteration 60, loss = 0.0023
Iteration 80, loss = 0.0138
--- Epoch 345 / 100000 - 2793 epochs total
Iteration 0, loss = 0.0148
Iteration 20, loss = 0.0026
Iteration 40, loss = 0.0041
Iteration 60, loss = 0.0099
Iteration 80, loss = 0.0048
--- Epoch 346 / 100000 - 2794 epochs total
Iteration 0, loss = 0.0015
Iteration 20, loss = 0.0053
Iteration 40, loss = 0.0016
Iteration 60, loss = 0.0170
Iteration 80, loss = 0.0027
--- Epoch 347 / 100000 - 2795 epochs total
Iteration 0, loss = 0.0023
Iteration 20, loss = 0.0057
Iteration 40, loss = 0.0218
Iteration 60, loss = 0.0213
Iteration 80, loss = 0.0049
--- Epoch 348 / 100000 - 2796 epochs total
Iteration 0, loss = 0.0138
Iteration 20, loss = 0.0038
Iteration 40, loss = 0.0176
Iteration 60, loss = 0.0178
Iteration 80, loss = 0.0100
--- Epoch 349 / 100000 - 2797 epochs total
Iteration 0, loss = 0.0231
Iteration 20, loss = 0.0027
Iteration 40, loss = 0.0053
Iteration 60, loss = 0.0044
Iteration 80, loss = 0.0054
--- Epoch 350 / 100000 - 2798 epochs total
Iteration 0, loss = 0.0177
Iteration 20, loss = 0.0175
Iteration 40, loss = 0.0026
Iteration 60, loss = 0.0211
Iteration 80, loss = 0.0035
--- Epoch 351 / 100000 - 2799 epochs total
Iteration 0, loss = 0.0144
Iteration 20, loss = 0.0050
Iteration 40, loss = 0.0104
Iteration 60, loss = 0.0055
Iteration 80, loss = 0.0036
--- Epoch 352 / 100000 - 2800 epochs total
Iteration 0, loss = 0.0032
Iteration 20, loss = 0.0015
Iteration 40, loss = 0.0039
Iteration 60, loss = 0.0029
Iteration 80, loss = 0.0114
--- Epoch 353 / 100000 - 2801 epochs total
Iteration 0, loss = 0.0034
Iteration 20, loss = 0.0073
Iteration 40, loss = 0.0066
Iteration 60, loss = 0.0077
Iteration 80, loss = 0.0148
--- Epoch 354 / 100000 - 2802 epochs total
Iteration 0, loss = 0.0089
Iteration 20, loss = 0.0077
Iteration 40, loss = 0.0035
Iteration 60, loss = 0.0042
Iteration 80, loss = 0.0044
--- Epoch 355 / 100000 - 2803 epochs total
Iteration 0, loss = 0.0146
Iteration 20, loss = 0.0030
Iteration 40, loss = 0.0069
Iteration 60, loss = 0.0012
Iteration 80, loss = 0.0882
--- Epoch 356 / 100000 - 2804 epochs total
Iteration 0, loss = 0.0039
Iteration 20, loss = 0.0140
Iteration 40, loss = 0.0124
Iteration 60, loss = 0.0037
Iteration 80, loss = 0.0097
--- Epoch 357 / 100000 - 2805 epochs total
Iteration 0, loss = 0.0040
Iteration 20, loss = 0.0364
Iteration 40, loss = 0.0012
Iteration 60, loss = 0.0131
Iteration 80, loss = 0.0112
--- Epoch 358 / 100000 - 2806 epochs total
Iteration 0, loss = 0.0133
Iteration 20, loss = 0.0121
Iteration 40, loss = 0.0033
Iteration 60, loss = 0.0110
Iteration 80, loss = 0.0278
--- Epoch 359 / 100000 - 2807 epochs total
Iteration 0, loss = 0.0049
Iteration 20, loss = 0.0041
Iteration 40, loss = 0.0098
Iteration 60, loss = 0.0091
Iteration 80, loss = 0.0048
--- Epoch 360 / 100000 - 2808 epochs total
Iteration 0, loss = 0.0050
Iteration 20, loss = 0.0111
Iteration 40, loss = 0.0145
Iteration 60, loss = 0.0053
Iteration 80, loss = 0.0024
--- Epoch 361 / 100000 - 2809 epochs total
Iteration 0, loss = 0.0027
Iteration 20, loss = 0.0148
Iteration 40, loss = 0.0052
Iteration 60, loss = 0.0072
Iteration 80, loss = 0.0016
--- Epoch 362 / 100000 - 2810 epochs total
Iteration 0, loss = 0.0048
Iteration 20, loss = 0.0053
Iteration 40, loss = 0.0076
Iteration 60, loss = 0.0027
Iteration 80, loss = 0.0010
--- Epoch 363 / 100000 - 2811 epochs total
Iteration 0, loss = 0.0099
Iteration 20, loss = 0.0081
Iteration 40, loss = 0.0047
Iteration 60, loss = 0.0135
Iteration 80, loss = 0.0036
--- Epoch 364 / 100000 - 2812 epochs total
Iteration 0, loss = 0.0280
Iteration 20, loss = 0.0048
Iteration 40, loss = 0.0068
Iteration 60, loss = 0.0109
Iteration 80, loss = 0.0158
--- Epoch 365 / 100000 - 2813 epochs total
Iteration 0, loss = 0.0064
Iteration 20, loss = 0.0018
Iteration 40, loss = 0.0144
Iteration 60, loss = 0.0022
Iteration 80, loss = 0.0027
--- Epoch 366 / 100000 - 2814 epochs total
Iteration 0, loss = 0.0039
Iteration 20, loss = 0.0078
Iteration 40, loss = 0.0322
Iteration 60, loss = 0.0016
Iteration 80, loss = 0.0015
--- Epoch 367 / 100000 - 2815 epochs total
Iteration 0, loss = 0.0107
Iteration 20, loss = 0.0282
Iteration 40, loss = 0.0015
Iteration 60, loss = 0.0016
Iteration 80, loss = 0.0063
--- Epoch 368 / 100000 - 2816 epochs total
Iteration 0, loss = 0.0037
Iteration 20, loss = 0.0115
Iteration 40, loss = 0.0135
Iteration 60, loss = 0.0164
Iteration 80, loss = 0.0084
--- Epoch 369 / 100000 - 2817 epochs total
Iteration 0, loss = 0.0020
Iteration 20, loss = 0.0060
Iteration 40, loss = 0.0017
Iteration 60, loss = 0.0081
Iteration 80, loss = 0.0037
--- Epoch 370 / 100000 - 2818 epochs total
Iteration 0, loss = 0.0039
Iteration 20, loss = 0.0041
Iteration 40, loss = 0.0093
Iteration 60, loss = 0.0031
Iteration 80, loss = 0.0058
--- Epoch 371 / 100000 - 2819 epochs total
Iteration 0, loss = 0.0044
Iteration 20, loss = 0.0026
Iteration 40, loss = 0.0069
Iteration 60, loss = 0.0150
Iteration 80, loss = 0.0102
--- Epoch 372 / 100000 - 2820 epochs total
Iteration 0, loss = 0.0170
Iteration 20, loss = 0.0068
Iteration 40, loss = 0.0117
Iteration 60, loss = 0.0035
Iteration 80, loss = 0.0219
--- Epoch 373 / 100000 - 2821 epochs total
Iteration 0, loss = 0.0019
Iteration 20, loss = 0.0044
Iteration 40, loss = 0.0013
Iteration 60, loss = 0.0018
Iteration 80, loss = 0.0016
--- Epoch 374 / 100000 - 2822 epochs total
Iteration 0, loss = 0.0018
Iteration 20, loss = 0.0044
Iteration 40, loss = 0.0126
Iteration 60, loss = 0.0049
Iteration 80, loss = 0.0023
--- Epoch 375 / 100000 - 2823 epochs total
Iteration 0, loss = 0.0053
Iteration 20, loss = 0.0123
Iteration 40, loss = 0.0012
Iteration 60, loss = 0.0035
Iteration 80, loss = 0.0111
--- Epoch 376 / 100000 - 2824 epochs total
Iteration 0, loss = 0.0042
Iteration 20, loss = 0.0169
Iteration 40, loss = 0.0017
Iteration 60, loss = 0.0352
Iteration 80, loss = 0.0037
--- Epoch 377 / 100000 - 2825 epochs total
Iteration 0, loss = 0.0183
Iteration 20, loss = 0.0032
Iteration 40, loss = 0.0081
Iteration 60, loss = 0.0120
Iteration 80, loss = 0.0039
--- Epoch 378 / 100000 - 2826 epochs total
Iteration 0, loss = 0.0045
Iteration 20, loss = 0.0017
Iteration 40, loss = 0.0275
Iteration 60, loss = 0.0052
Iteration 80, loss = 0.0041
--- Epoch 379 / 100000 - 2827 epochs total
Iteration 0, loss = 0.0317
Iteration 20, loss = 0.0077
Iteration 40, loss = 0.0094
Iteration 60, loss = 0.0239
Iteration 80, loss = 0.0051
--- Epoch 380 / 100000 - 2828 epochs total
Iteration 0, loss = 0.0159
Iteration 20, loss = 0.0057
Iteration 40, loss = 0.0057
Iteration 60, loss = 0.0069
Iteration 80, loss = 0.0087
--- Epoch 381 / 100000 - 2829 epochs total
Iteration 0, loss = 0.0014
Iteration 20, loss = 0.0077
Iteration 40, loss = 0.0053
Iteration 60, loss = 0.0043
Iteration 80, loss = 0.0016
--- Epoch 382 / 100000 - 2830 epochs total
Iteration 0, loss = 0.0075
Iteration 20, loss = 0.0029
Iteration 40, loss = 0.0044
Iteration 60, loss = 0.0008
Iteration 80, loss = 0.0044
--- Epoch 383 / 100000 - 2831 epochs total
Iteration 0, loss = 0.0063
Iteration 20, loss = 0.0234
Iteration 40, loss = 0.0054
Iteration 60, loss = 0.0047
Iteration 80, loss = 0.0095
--- Epoch 384 / 100000 - 2832 epochs total
Iteration 0, loss = 0.0058
Iteration 20, loss = 0.0263
Iteration 40, loss = 0.0029
Iteration 60, loss = 0.0228
Iteration 80, loss = 0.0047
--- Epoch 385 / 100000 - 2833 epochs total
Iteration 0, loss = 0.0112
Iteration 20, loss = 0.0030
Iteration 40, loss = 0.0017
Iteration 60, loss = 0.0097
Iteration 80, loss = 0.0053
--- Epoch 386 / 100000 - 2834 epochs total
Iteration 0, loss = 0.0192
Iteration 20, loss = 0.0168
Iteration 40, loss = 0.0057
Iteration 60, loss = 0.0044
Iteration 80, loss = 0.0119
--- Epoch 387 / 100000 - 2835 epochs total
Iteration 0, loss = 0.0083
Iteration 20, loss = 0.0041
Iteration 40, loss = 0.0010
Iteration 60, loss = 0.0027
Iteration 80, loss = 0.0051
--- Epoch 388 / 100000 - 2836 epochs total
Iteration 0, loss = 0.0029
Iteration 20, loss = 0.0249
Iteration 40, loss = 0.0079
Iteration 60, loss = 0.0044
Iteration 80, loss = 0.0032
--- Epoch 389 / 100000 - 2837 epochs total
Iteration 0, loss = 0.0114
Iteration 20, loss = 0.0088
Iteration 40, loss = 0.0113
Iteration 60, loss = 0.0105
Iteration 80, loss = 0.0091
--- Epoch 390 / 100000 - 2838 epochs total
Iteration 0, loss = 0.0034
Iteration 20, loss = 0.0059
Iteration 40, loss = 0.0038
Iteration 60, loss = 0.0074
Iteration 80, loss = 0.0258
--- Epoch 391 / 100000 - 2839 epochs total
Iteration 0, loss = 0.0091
Iteration 20, loss = 0.0093
Iteration 40, loss = 0.0100
Iteration 60, loss = 0.0015
Iteration 80, loss = 0.0049
--- Epoch 392 / 100000 - 2840 epochs total
Iteration 0, loss = 0.0107
Iteration 20, loss = 0.0071
Iteration 40, loss = 0.0065
Iteration 60, loss = 0.0707
Iteration 80, loss = 0.0114
--- Epoch 393 / 100000 - 2841 epochs total
Iteration 0, loss = 0.0042
Iteration 20, loss = 0.0071
Iteration 40, loss = 0.0046
Iteration 60, loss = 0.0013
Iteration 80, loss = 0.0046
--- Epoch 394 / 100000 - 2842 epochs total
Iteration 0, loss = 0.0063
Iteration 20, loss = 0.0112
Iteration 40, loss = 0.0086
Iteration 60, loss = 0.0067
Iteration 80, loss = 0.0082
--- Epoch 395 / 100000 - 2843 epochs total
Iteration 0, loss = 0.0129
Iteration 20, loss = 0.0094
Iteration 40, loss = 0.0028
Iteration 60, loss = 0.0057
Iteration 80, loss = 0.0112
--- Epoch 396 / 100000 - 2844 epochs total
Iteration 0, loss = 0.0201
Iteration 20, loss = 0.0138
Iteration 40, loss = 0.0017
Iteration 60, loss = 0.0044
Iteration 80, loss = 0.0039
--- Epoch 397 / 100000 - 2845 epochs total
Iteration 0, loss = 0.0330
Iteration 20, loss = 0.0176
Iteration 40, loss = 0.0102
Iteration 60, loss = 0.0048
Iteration 80, loss = 0.0084
--- Epoch 398 / 100000 - 2846 epochs total
Iteration 0, loss = 0.0040
Iteration 20, loss = 0.0015
Iteration 40, loss = 0.0033
Iteration 60, loss = 0.0026
Iteration 80, loss = 0.0076
--- Epoch 399 / 100000 - 2847 epochs total
Iteration 0, loss = 0.0167
Iteration 20, loss = 0.0304
Iteration 40, loss = 0.0032
Iteration 60, loss = 0.0131
Iteration 80, loss = 0.0138
--- Epoch 400 / 100000 - 2848 epochs total
Iteration 0, loss = 0.0182
Iteration 20, loss = 0.0094
Iteration 40, loss = 0.0358
Iteration 60, loss = 0.0051
Iteration 80, loss = 0.0033
--- Epoch 401 / 100000 - 2849 epochs total
Iteration 0, loss = 0.0029
Iteration 20, loss = 0.0248
Iteration 40, loss = 0.0079
Iteration 60, loss = 0.0092
Iteration 80, loss = 0.0408
--- Epoch 402 / 100000 - 2850 epochs total
Iteration 0, loss = 0.0139
Iteration 20, loss = 0.0249
Iteration 40, loss = 0.0178
Iteration 60, loss = 0.0089
Iteration 80, loss = 0.0020
--- Epoch 403 / 100000 - 2851 epochs total
Iteration 0, loss = 0.0117
Iteration 20, loss = 0.0386
Iteration 40, loss = 0.0131
Iteration 60, loss = 0.0352
Iteration 80, loss = 0.0109
--- Epoch 404 / 100000 - 2852 epochs total
Iteration 0, loss = 0.0115
Iteration 20, loss = 0.0069
Iteration 40, loss = 0.0053
Iteration 60, loss = 0.0040
Iteration 80, loss = 0.0130
--- Epoch 405 / 100000 - 2853 epochs total
Iteration 0, loss = 0.0081
Iteration 20, loss = 0.0038
Iteration 40, loss = 0.0133
Iteration 60, loss = 0.0050
Iteration 80, loss = 0.0089
--- Epoch 406 / 100000 - 2854 epochs total
Iteration 0, loss = 0.0023
Iteration 20, loss = 0.0076
Iteration 40, loss = 0.0343
Iteration 60, loss = 0.0018
Iteration 80, loss = 0.0066
--- Epoch 407 / 100000 - 2855 epochs total
Iteration 0, loss = 0.0090
Iteration 20, loss = 0.0051
Iteration 40, loss = 0.0506
Iteration 60, loss = 0.0038
Iteration 80, loss = 0.0030
--- Epoch 408 / 100000 - 2856 epochs total
Iteration 0, loss = 0.0552
Iteration 20, loss = 0.0034
Iteration 40, loss = 0.0170
Iteration 60, loss = 0.0146
Iteration 80, loss = 0.0073
--- Epoch 409 / 100000 - 2857 epochs total
Iteration 0, loss = 0.0151
Iteration 20, loss = 0.0229
Iteration 40, loss = 0.0074
Iteration 60, loss = 0.0101
Iteration 80, loss = 0.0061
--- Epoch 410 / 100000 - 2858 epochs total
Iteration 0, loss = 0.0048
Iteration 20, loss = 0.0046
Iteration 40, loss = 0.0062
Iteration 60, loss = 0.0191
Iteration 80, loss = 0.0040
--- Epoch 411 / 100000 - 2859 epochs total
Iteration 0, loss = 0.0122
Iteration 20, loss = 0.0152
Iteration 40, loss = 0.0098
Iteration 60, loss = 0.0033
Iteration 80, loss = 0.0053
--- Epoch 412 / 100000 - 2860 epochs total
Iteration 0, loss = 0.0014
Iteration 20, loss = 0.0012
Iteration 40, loss = 0.0070
Iteration 60, loss = 0.0085
Iteration 80, loss = 0.0135
--- Epoch 413 / 100000 - 2861 epochs total
Iteration 0, loss = 0.0125
Iteration 20, loss = 0.0073
Iteration 40, loss = 0.0026
Iteration 60, loss = 0.0122
Iteration 80, loss = 0.0074
--- Epoch 414 / 100000 - 2862 epochs total
Iteration 0, loss = 0.0096
Iteration 20, loss = 0.0038
Iteration 40, loss = 0.0059
Iteration 60, loss = 0.0020
Iteration 80, loss = 0.0054
--- Epoch 415 / 100000 - 2863 epochs total
Iteration 0, loss = 0.0452
Iteration 20, loss = 0.0132
Iteration 40, loss = 0.0078
Iteration 60, loss = 0.0085
Iteration 80, loss = 0.0154
--- Epoch 416 / 100000 - 2864 epochs total
Iteration 0, loss = 0.0144
Iteration 20, loss = 0.0298
Iteration 40, loss = 0.0213
Iteration 60, loss = 0.0103
Iteration 80, loss = 0.0145
--- Epoch 417 / 100000 - 2865 epochs total
Iteration 0, loss = 0.0071
Iteration 20, loss = 0.0012
Iteration 40, loss = 0.0024
Iteration 60, loss = 0.0047
Iteration 80, loss = 0.0282
--- Epoch 418 / 100000 - 2866 epochs total
Iteration 0, loss = 0.0100
Iteration 20, loss = 0.0068
Iteration 40, loss = 0.0028
Iteration 60, loss = 0.0295
Iteration 80, loss = 0.0091
--- Epoch 419 / 100000 - 2867 epochs total
Iteration 0, loss = 0.0041
Iteration 20, loss = 0.0143
Iteration 40, loss = 0.0029
Iteration 60, loss = 0.0049
Iteration 80, loss = 0.0171
--- Epoch 420 / 100000 - 2868 epochs total
Iteration 0, loss = 0.0038
Iteration 20, loss = 0.0104
Iteration 40, loss = 0.0078
Iteration 60, loss = 0.0119
Iteration 80, loss = 0.0016
--- Epoch 421 / 100000 - 2869 epochs total
Iteration 0, loss = 0.0039
Iteration 20, loss = 0.0113
Iteration 40, loss = 0.0121
Iteration 60, loss = 0.0074
Iteration 80, loss = 0.0017
--- Epoch 422 / 100000 - 2870 epochs total
Iteration 0, loss = 0.0050
Iteration 20, loss = 0.0051
Iteration 40, loss = 0.0028
Iteration 60, loss = 0.0226
Iteration 80, loss = 0.0035
--- Epoch 423 / 100000 - 2871 epochs total
Iteration 0, loss = 0.0159
Iteration 20, loss = 0.0037
Iteration 40, loss = 0.0035
Iteration 60, loss = 0.0048
Iteration 80, loss = 0.0115
--- Epoch 424 / 100000 - 2872 epochs total
Iteration 0, loss = 0.0201
Iteration 20, loss = 0.0075
Iteration 40, loss = 0.0141
Iteration 60, loss = 0.0052
Iteration 80, loss = 0.0429
--- Epoch 425 / 100000 - 2873 epochs total
Iteration 0, loss = 0.0147
Iteration 20, loss = 0.0015
Iteration 40, loss = 0.0103
Iteration 60, loss = 0.0065
Iteration 80, loss = 0.0014
--- Epoch 426 / 100000 - 2874 epochs total
Iteration 0, loss = 0.0592
Iteration 20, loss = 0.0187
Iteration 40, loss = 0.0148
Iteration 60, loss = 0.0333
Iteration 80, loss = 0.0169
--- Epoch 427 / 100000 - 2875 epochs total
Iteration 0, loss = 0.0132
Iteration 20, loss = 0.0033
Iteration 40, loss = 0.0091
Iteration 60, loss = 0.0050
Iteration 80, loss = 0.0141
--- Epoch 428 / 100000 - 2876 epochs total
Iteration 0, loss = 0.0099
Iteration 20, loss = 0.0072
Iteration 40, loss = 0.0092
Iteration 60, loss = 0.0065
Iteration 80, loss = 0.0108
--- Epoch 429 / 100000 - 2877 epochs total
Iteration 0, loss = 0.0217
Iteration 20, loss = 0.0098
Iteration 40, loss = 0.0025
Iteration 60, loss = 0.0084
Iteration 80, loss = 0.0201
--- Epoch 430 / 100000 - 2878 epochs total
Iteration 0, loss = 0.0033
Iteration 20, loss = 0.0016
Iteration 40, loss = 0.0213
Iteration 60, loss = 0.0103
Iteration 80, loss = 0.0052
--- Epoch 431 / 100000 - 2879 epochs total
Iteration 0, loss = 0.0033
Iteration 20, loss = 0.0090
Iteration 40, loss = 0.0179
Iteration 60, loss = 0.0031
Iteration 80, loss = 0.0013
--- Epoch 432 / 100000 - 2880 epochs total
Iteration 0, loss = 0.0033
Iteration 20, loss = 0.0123
Iteration 40, loss = 0.0040
Iteration 60, loss = 0.0028
Iteration 80, loss = 0.0029
--- Epoch 433 / 100000 - 2881 epochs total
Iteration 0, loss = 0.0092
Iteration 20, loss = 0.0015
Iteration 40, loss = 0.0012
Iteration 60, loss = 0.0102
Iteration 80, loss = 0.0218
--- Epoch 434 / 100000 - 2882 epochs total
Iteration 0, loss = 0.0149
Iteration 20, loss = 0.0172
Iteration 40, loss = 0.0091
Iteration 60, loss = 0.0065
Iteration 80, loss = 0.0110
--- Epoch 435 / 100000 - 2883 epochs total
Iteration 0, loss = 0.0089
Iteration 20, loss = 0.0088
Iteration 40, loss = 0.0229
Iteration 60, loss = 0.0079
Iteration 80, loss = 0.0066
--- Epoch 436 / 100000 - 2884 epochs total
Iteration 0, loss = 0.0119
Iteration 20, loss = 0.0127
Iteration 40, loss = 0.0029
Iteration 60, loss = 0.0112
Iteration 80, loss = 0.0087
--- Epoch 437 / 100000 - 2885 epochs total
Iteration 0, loss = 0.0035
Iteration 20, loss = 0.0258
Iteration 40, loss = 0.0057
Iteration 60, loss = 0.0101
Iteration 80, loss = 0.0106
--- Epoch 438 / 100000 - 2886 epochs total
Iteration 0, loss = 0.0060
Iteration 20, loss = 0.0074
Iteration 40, loss = 0.0181
Iteration 60, loss = 0.0060
Iteration 80, loss = 0.0221
--- Epoch 439 / 100000 - 2887 epochs total
Iteration 0, loss = 0.0044
Iteration 20, loss = 0.0059
Iteration 40, loss = 0.0011
Iteration 60, loss = 0.0713
Iteration 80, loss = 0.0018
--- Epoch 440 / 100000 - 2888 epochs total
Iteration 0, loss = 0.0158
Iteration 20, loss = 0.0093
Iteration 40, loss = 0.0027
Iteration 60, loss = 0.0065
Iteration 80, loss = 0.0017
--- Epoch 441 / 100000 - 2889 epochs total
Iteration 0, loss = 0.0096
Iteration 20, loss = 0.0101
Iteration 40, loss = 0.0129
Iteration 60, loss = 0.0032
Iteration 80, loss = 0.0040
--- Epoch 442 / 100000 - 2890 epochs total
Iteration 0, loss = 0.0268
Iteration 20, loss = 0.0143
Iteration 40, loss = 0.0054
Iteration 60, loss = 0.0030
Iteration 80, loss = 0.0490
--- Epoch 443 / 100000 - 2891 epochs total
Iteration 0, loss = 0.0062
Iteration 20, loss = 0.0080
Iteration 40, loss = 0.0042
Iteration 60, loss = 0.0133
Iteration 80, loss = 0.0040
--- Epoch 444 / 100000 - 2892 epochs total
Iteration 0, loss = 0.0060
Iteration 20, loss = 0.0158
Iteration 40, loss = 0.0114
Iteration 60, loss = 0.0022
Iteration 80, loss = 0.0223
--- Epoch 445 / 100000 - 2893 epochs total
Iteration 0, loss = 0.0078
Iteration 20, loss = 0.0121
Iteration 40, loss = 0.0286
Iteration 60, loss = 0.0067
Iteration 80, loss = 0.0070
--- Epoch 446 / 100000 - 2894 epochs total
Iteration 0, loss = 0.0080
Iteration 20, loss = 0.0063
Iteration 40, loss = 0.0160
Iteration 60, loss = 0.0045
Iteration 80, loss = 0.0026
--- Epoch 447 / 100000 - 2895 epochs total
Iteration 0, loss = 0.0011
Iteration 20, loss = 0.0136
Iteration 40, loss = 0.0199
Iteration 60, loss = 0.0049
Iteration 80, loss = 0.0029
--- Epoch 448 / 100000 - 2896 epochs total
Iteration 0, loss = 0.0330
Iteration 20, loss = 0.0511
Iteration 40, loss = 0.0119
Iteration 60, loss = 0.0067
Iteration 80, loss = 0.0094
--- Epoch 449 / 100000 - 2897 epochs total
Iteration 0, loss = 0.0080
Iteration 20, loss = 0.0039
Iteration 40, loss = 0.0011
Iteration 60, loss = 0.0091
Iteration 80, loss = 0.0083
--- Epoch 450 / 100000 - 2898 epochs total
Iteration 0, loss = 0.0019
Iteration 20, loss = 0.0188
Iteration 40, loss = 0.0037
Iteration 60, loss = 0.0040
Iteration 80, loss = 0.0083
--- Epoch 451 / 100000 - 2899 epochs total
Iteration 0, loss = 0.0039
Iteration 20, loss = 0.0039
Iteration 40, loss = 0.0023
Iteration 60, loss = 0.0030
Iteration 80, loss = 0.0036
--- Epoch 452 / 100000 - 2900 epochs total
Iteration 0, loss = 0.0202
Iteration 20, loss = 0.0084
Iteration 40, loss = 0.0034
Iteration 60, loss = 0.0172
Iteration 80, loss = 0.0104
--- Epoch 453 / 100000 - 2901 epochs total
Iteration 0, loss = 0.0035
Iteration 20, loss = 0.0150
Iteration 40, loss = 0.0053
Iteration 60, loss = 0.0030
Iteration 80, loss = 0.0137
--- Epoch 454 / 100000 - 2902 epochs total
Iteration 0, loss = 0.0085
Iteration 20, loss = 0.0069
Iteration 40, loss = 0.0373
Iteration 60, loss = 0.0023
Iteration 80, loss = 0.0082
--- Epoch 455 / 100000 - 2903 epochs total
Iteration 0, loss = 0.0144
Iteration 20, loss = 0.0086
Iteration 40, loss = 0.0018
Iteration 60, loss = 0.0066
Iteration 80, loss = 0.0259
--- Epoch 456 / 100000 - 2904 epochs total
Iteration 0, loss = 0.0034
Iteration 20, loss = 0.0172
Iteration 40, loss = 0.0045
Iteration 60, loss = 0.0219
Iteration 80, loss = 0.0040
--- Epoch 457 / 100000 - 2905 epochs total
Iteration 0, loss = 0.0087
Iteration 20, loss = 0.0046
Iteration 40, loss = 0.0048
Iteration 60, loss = 0.0092
Iteration 80, loss = 0.0095
--- Epoch 458 / 100000 - 2906 epochs total
Iteration 0, loss = 0.0457
Iteration 20, loss = 0.0027
Iteration 40, loss = 0.0088
Iteration 60, loss = 0.0089
Iteration 80, loss = 0.0100
--- Epoch 459 / 100000 - 2907 epochs total
Iteration 0, loss = 0.0039
Iteration 20, loss = 0.0028
Iteration 40, loss = 0.0135
Iteration 60, loss = 0.0017
Iteration 80, loss = 0.0117
--- Epoch 460 / 100000 - 2908 epochs total
Iteration 0, loss = 0.0388
Iteration 20, loss = 0.0169
Iteration 40, loss = 0.0021
Iteration 60, loss = 0.0061
Iteration 80, loss = 0.0146
--- Epoch 461 / 100000 - 2909 epochs total
Iteration 0, loss = 0.0060
Iteration 20, loss = 0.0270
Iteration 40, loss = 0.0089
Iteration 60, loss = 0.0207
Iteration 80, loss = 0.0048
--- Epoch 462 / 100000 - 2910 epochs total
Iteration 0, loss = 0.0238
Iteration 20, loss = 0.0063
Iteration 40, loss = 0.0028
Iteration 60, loss = 0.0171
Iteration 80, loss = 0.0201
--- Epoch 463 / 100000 - 2911 epochs total
Iteration 0, loss = 0.0163
Iteration 20, loss = 0.0171
Iteration 40, loss = 0.0029
Iteration 60, loss = 0.0011
Iteration 80, loss = 0.0121
--- Epoch 464 / 100000 - 2912 epochs total
Iteration 0, loss = 0.0008
Iteration 20, loss = 0.0035
Iteration 40, loss = 0.0079
Iteration 60, loss = 0.0174
Iteration 80, loss = 0.0183
--- Epoch 465 / 100000 - 2913 epochs total
Iteration 0, loss = 0.0025
Iteration 20, loss = 0.0052
Iteration 40, loss = 0.0038
Iteration 60, loss = 0.0013
Iteration 80, loss = 0.0079
--- Epoch 466 / 100000 - 2914 epochs total
Iteration 0, loss = 0.0034
Iteration 20, loss = 0.0061
Iteration 40, loss = 0.0165
Iteration 60, loss = 0.0048
Iteration 80, loss = 0.0047
--- Epoch 467 / 100000 - 2915 epochs total
Iteration 0, loss = 0.0195
Iteration 20, loss = 0.0105
Iteration 40, loss = 0.0158
Iteration 60, loss = 0.0040
Iteration 80, loss = 0.0252
--- Epoch 468 / 100000 - 2916 epochs total
Iteration 0, loss = 0.0112
Iteration 20, loss = 0.0309
Iteration 40, loss = 0.0195
Iteration 60, loss = 0.0046
Iteration 80, loss = 0.0419
--- Epoch 469 / 100000 - 2917 epochs total
Iteration 0, loss = 0.0087
Iteration 20, loss = 0.0031
Iteration 40, loss = 0.0014
Iteration 60, loss = 0.0083
Iteration 80, loss = 0.0060
--- Epoch 470 / 100000 - 2918 epochs total
Iteration 0, loss = 0.0053
Iteration 20, loss = 0.0070
Iteration 40, loss = 0.0033
Iteration 60, loss = 0.0065
Iteration 80, loss = 0.0025
--- Epoch 471 / 100000 - 2919 epochs total
Iteration 0, loss = 0.0059
Iteration 20, loss = 0.0136
Iteration 40, loss = 0.0037
Iteration 60, loss = 0.0024
Iteration 80, loss = 0.0148
--- Epoch 472 / 100000 - 2920 epochs total
Iteration 0, loss = 0.0147
Iteration 20, loss = 0.0134
Iteration 40, loss = 0.0044
Iteration 60, loss = 0.0084
Iteration 80, loss = 0.0084
--- Epoch 473 / 100000 - 2921 epochs total
Iteration 0, loss = 0.0029
Iteration 20, loss = 0.0039
Iteration 40, loss = 0.0075
Iteration 60, loss = 0.0087
Iteration 80, loss = 0.0037
--- Epoch 474 / 100000 - 2922 epochs total
Iteration 0, loss = 0.0049
Iteration 20, loss = 0.0192
Iteration 40, loss = 0.0045
Iteration 60, loss = 0.0041
Iteration 80, loss = 0.0344
--- Epoch 475 / 100000 - 2923 epochs total
Iteration 0, loss = 0.0175
Iteration 20, loss = 0.0016
Iteration 40, loss = 0.0166
Iteration 60, loss = 0.0014
Iteration 80, loss = 0.0134
--- Epoch 476 / 100000 - 2924 epochs total
Iteration 0, loss = 0.0196
Iteration 20, loss = 0.0045
Iteration 40, loss = 0.0037
Iteration 60, loss = 0.0029
Iteration 80, loss = 0.0037
--- Epoch 477 / 100000 - 2925 epochs total
Iteration 0, loss = 0.0102
Iteration 20, loss = 0.0032
Iteration 40, loss = 0.0022
Iteration 60, loss = 0.0058
Iteration 80, loss = 0.0079
--- Epoch 478 / 100000 - 2926 epochs total
Iteration 0, loss = 0.0246
Iteration 20, loss = 0.0054
Iteration 40, loss = 0.0019
Iteration 60, loss = 0.0112
Iteration 80, loss = 0.0100
--- Epoch 479 / 100000 - 2927 epochs total
Iteration 0, loss = 0.0082
Iteration 20, loss = 0.0195
Iteration 40, loss = 0.0019
Iteration 60, loss = 0.0120
Iteration 80, loss = 0.0164
--- Epoch 480 / 100000 - 2928 epochs total
Iteration 0, loss = 0.0087
Iteration 20, loss = 0.0346
Iteration 40, loss = 0.0203
Iteration 60, loss = 0.0086
Iteration 80, loss = 0.0035
--- Epoch 481 / 100000 - 2929 epochs total
Iteration 0, loss = 0.0021
Iteration 20, loss = 0.0152
Iteration 40, loss = 0.0039
Iteration 60, loss = 0.0022
Iteration 80, loss = 0.0046
--- Epoch 482 / 100000 - 2930 epochs total
Iteration 0, loss = 0.0303
Iteration 20, loss = 0.0018
Iteration 40, loss = 0.0143
Iteration 60, loss = 0.0162
Iteration 80, loss = 0.0054
--- Epoch 483 / 100000 - 2931 epochs total
Iteration 0, loss = 0.0080
Iteration 20, loss = 0.0060
Iteration 40, loss = 0.0018
Iteration 60, loss = 0.0236
Iteration 80, loss = 0.0061
--- Epoch 484 / 100000 - 2932 epochs total
Iteration 0, loss = 0.0650
Iteration 20, loss = 0.0114
Iteration 40, loss = 0.0095
Iteration 60, loss = 0.0089
Iteration 80, loss = 0.0018
--- Epoch 485 / 100000 - 2933 epochs total
Iteration 0, loss = 0.0042
Iteration 20, loss = 0.0030
Iteration 40, loss = 0.0066
Iteration 60, loss = 0.0093
Iteration 80, loss = 0.0061
--- Epoch 486 / 100000 - 2934 epochs total
Iteration 0, loss = 0.0088
Iteration 20, loss = 0.0028
Iteration 40, loss = 0.0045
Iteration 60, loss = 0.0059
Iteration 80, loss = 0.0086
--- Epoch 487 / 100000 - 2935 epochs total
Iteration 0, loss = 0.0163
Iteration 20, loss = 0.0341
Iteration 40, loss = 0.0119
Iteration 60, loss = 0.0129
Iteration 80, loss = 0.0034
--- Epoch 488 / 100000 - 2936 epochs total
Iteration 0, loss = 0.0056
Iteration 20, loss = 0.0015
Iteration 40, loss = 0.0205
Iteration 60, loss = 0.0055
Iteration 80, loss = 0.0199
--- Epoch 489 / 100000 - 2937 epochs total
Iteration 0, loss = 0.0022
Iteration 20, loss = 0.0025
Iteration 40, loss = 0.0037
Iteration 60, loss = 0.0051
Iteration 80, loss = 0.0029
--- Epoch 490 / 100000 - 2938 epochs total
Iteration 0, loss = 0.0031
Iteration 20, loss = 0.0043
Iteration 40, loss = 0.0126
Iteration 60, loss = 0.0136
Iteration 80, loss = 0.0111
--- Epoch 491 / 100000 - 2939 epochs total
Iteration 0, loss = 0.0112
Iteration 20, loss = 0.0065
Iteration 40, loss = 0.0086
Iteration 60, loss = 0.0299
Iteration 80, loss = 0.0207
--- Epoch 492 / 100000 - 2940 epochs total
Iteration 0, loss = 0.0052
Iteration 20, loss = 0.0059
Iteration 40, loss = 0.0076
Iteration 60, loss = 0.0142
Iteration 80, loss = 0.0132
--- Epoch 493 / 100000 - 2941 epochs total
Iteration 0, loss = 0.0188
Iteration 20, loss = 0.0296
Iteration 40, loss = 0.0048
Iteration 60, loss = 0.0064
Iteration 80, loss = 0.0044
--- Epoch 494 / 100000 - 2942 epochs total
Iteration 0, loss = 0.0130
Iteration 20, loss = 0.0135
Iteration 40, loss = 0.0053
Iteration 60, loss = 0.0118
Iteration 80, loss = 0.0087
--- Epoch 495 / 100000 - 2943 epochs total
Iteration 0, loss = 0.0077
Iteration 20, loss = 0.0036
Iteration 40, loss = 0.0111
Iteration 60, loss = 0.0074
Iteration 80, loss = 0.0066
--- Epoch 496 / 100000 - 2944 epochs total
Iteration 0, loss = 0.0462
Iteration 20, loss = 0.0314
Iteration 40, loss = 0.0050
Iteration 60, loss = 0.0178
Iteration 80, loss = 0.0037
--- Epoch 497 / 100000 - 2945 epochs total
Iteration 0, loss = 0.0043
Iteration 20, loss = 0.0143
Iteration 40, loss = 0.0149
Iteration 60, loss = 0.0127
Iteration 80, loss = 0.0435
--- Epoch 498 / 100000 - 2946 epochs total
Iteration 0, loss = 0.0024
Iteration 20, loss = 0.0055
Iteration 40, loss = 0.0069
Iteration 60, loss = 0.0073
Iteration 80, loss = 0.0026
--- Epoch 499 / 100000 - 2947 epochs total
Iteration 0, loss = 0.0135
Iteration 20, loss = 0.0032
Iteration 40, loss = 0.0274
Iteration 60, loss = 0.0100
Iteration 80, loss = 0.0215
--- Epoch 500 / 100000 - 2948 epochs total
Iteration 0, loss = 0.0102
Iteration 20, loss = 0.0229
Iteration 40, loss = 0.0035
Iteration 60, loss = 0.0347
Iteration 80, loss = 0.0085
--- Epoch 501 / 100000 - 2949 epochs total
Iteration 0, loss = 0.0072
Iteration 20, loss = 0.0118
Iteration 40, loss = 0.0045
Iteration 60, loss = 0.0084
Iteration 80, loss = 0.0051
--- Epoch 502 / 100000 - 2950 epochs total
Iteration 0, loss = 0.0068
Iteration 20, loss = 0.0063
Iteration 40, loss = 0.0043
Iteration 60, loss = 0.0054
Iteration 80, loss = 0.0038
--- Epoch 503 / 100000 - 2951 epochs total
Iteration 0, loss = 0.0135
Iteration 20, loss = 0.0031
Iteration 40, loss = 0.0073
Iteration 60, loss = 0.0059
Iteration 80, loss = 0.0012
--- Epoch 504 / 100000 - 2952 epochs total
Iteration 0, loss = 0.0057
Iteration 20, loss = 0.0093
Iteration 40, loss = 0.0109
Iteration 60, loss = 0.0042
Iteration 80, loss = 0.0073
--- Epoch 505 / 100000 - 2953 epochs total
Iteration 0, loss = 0.0043
Iteration 20, loss = 0.0097
Iteration 40, loss = 0.0125
Iteration 60, loss = 0.0058
Iteration 80, loss = 0.0083
--- Epoch 506 / 100000 - 2954 epochs total
Iteration 0, loss = 0.0096
Iteration 20, loss = 0.0038
Iteration 40, loss = 0.0062
Iteration 60, loss = 0.0065
Iteration 80, loss = 0.0037
--- Epoch 507 / 100000 - 2955 epochs total
Iteration 0, loss = 0.0046
Iteration 20, loss = 0.0119
Iteration 40, loss = 0.0309
Iteration 60, loss = 0.0051
Iteration 80, loss = 0.0032
--- Epoch 508 / 100000 - 2956 epochs total
Iteration 0, loss = 0.0118
Iteration 20, loss = 0.0079
Iteration 40, loss = 0.0048
Iteration 60, loss = 0.0329
Iteration 80, loss = 0.0050
--- Epoch 509 / 100000 - 2957 epochs total
Iteration 0, loss = 0.0036
Iteration 20, loss = 0.0051
Iteration 40, loss = 0.0025
Iteration 60, loss = 0.0231
Iteration 80, loss = 0.0090
--- Epoch 510 / 100000 - 2958 epochs total
Iteration 0, loss = 0.0112
Iteration 20, loss = 0.0106
Iteration 40, loss = 0.0017
Iteration 60, loss = 0.0107
Iteration 80, loss = 0.0145
--- Epoch 511 / 100000 - 2959 epochs total
Iteration 0, loss = 0.0032
Iteration 20, loss = 0.0135
Iteration 40, loss = 0.0094
Iteration 60, loss = 0.0068
Iteration 80, loss = 0.0302
--- Epoch 512 / 100000 - 2960 epochs total
Iteration 0, loss = 0.0123
Iteration 20, loss = 0.0063
Iteration 40, loss = 0.0188
Iteration 60, loss = 0.0030
Iteration 80, loss = 0.0098
--- Epoch 513 / 100000 - 2961 epochs total
Iteration 0, loss = 0.0032
Iteration 20, loss = 0.0053
Iteration 40, loss = 0.0026
Iteration 60, loss = 0.0092
Iteration 80, loss = 0.0053
--- Epoch 514 / 100000 - 2962 epochs total
Iteration 0, loss = 0.0189
Iteration 20, loss = 0.0021
Iteration 40, loss = 0.0035
Iteration 60, loss = 0.0110
Iteration 80, loss = 0.0229
--- Epoch 515 / 100000 - 2963 epochs total
Iteration 0, loss = 0.0038
Iteration 20, loss = 0.0106
Iteration 40, loss = 0.0035
Iteration 60, loss = 0.0241
Iteration 80, loss = 0.0072
--- Epoch 516 / 100000 - 2964 epochs total
Iteration 0, loss = 0.0244
Iteration 20, loss = 0.0049
Iteration 40, loss = 0.0084
Iteration 60, loss = 0.0203
Iteration 80, loss = 0.0194
--- Epoch 517 / 100000 - 2965 epochs total
Iteration 0, loss = 0.0069
Iteration 20, loss = 0.0061
Iteration 40, loss = 0.0076
Iteration 60, loss = 0.0039
Iteration 80, loss = 0.0059
--- Epoch 518 / 100000 - 2966 epochs total
Iteration 0, loss = 0.0047
Iteration 20, loss = 0.0225
Iteration 40, loss = 0.0901
Iteration 60, loss = 0.0020
Iteration 80, loss = 0.0017
--- Epoch 519 / 100000 - 2967 epochs total
Iteration 0, loss = 0.0143
Iteration 20, loss = 0.0035
Iteration 40, loss = 0.0085
Iteration 60, loss = 0.0104
Iteration 80, loss = 0.0183
--- Epoch 520 / 100000 - 2968 epochs total
Iteration 0, loss = 0.0121
Iteration 20, loss = 0.0020
Iteration 40, loss = 0.0046
Iteration 60, loss = 0.0088
Iteration 80, loss = 0.0059
--- Epoch 521 / 100000 - 2969 epochs total
Iteration 0, loss = 0.0297
Iteration 20, loss = 0.0123
Iteration 40, loss = 0.0145
Iteration 60, loss = 0.0066
Iteration 80, loss = 0.0139
--- Epoch 522 / 100000 - 2970 epochs total
Iteration 0, loss = 0.0022
Iteration 20, loss = 0.0191
Iteration 40, loss = 0.0069
Iteration 60, loss = 0.0016
Iteration 80, loss = 0.0135
--- Epoch 523 / 100000 - 2971 epochs total
Iteration 0, loss = 0.0067
Iteration 20, loss = 0.0020
Iteration 40, loss = 0.0029
Iteration 60, loss = 0.0044
Iteration 80, loss = 0.0038
--- Epoch 524 / 100000 - 2972 epochs total
Iteration 0, loss = 0.0284
Iteration 20, loss = 0.0099
Iteration 40, loss = 0.0037
Iteration 60, loss = 0.0079
Iteration 80, loss = 0.0050
--- Epoch 525 / 100000 - 2973 epochs total
Iteration 0, loss = 0.0076
Iteration 20, loss = 0.0156
Iteration 40, loss = 0.0042
Iteration 60, loss = 0.0043
Iteration 80, loss = 0.0059
--- Epoch 526 / 100000 - 2974 epochs total
Iteration 0, loss = 0.0086
Iteration 20, loss = 0.0052
Iteration 40, loss = 0.0092
Iteration 60, loss = 0.0020
Iteration 80, loss = 0.0064
--- Epoch 527 / 100000 - 2975 epochs total
Iteration 0, loss = 0.0020
Iteration 20, loss = 0.0044
Iteration 40, loss = 0.0042
Iteration 60, loss = 0.0086
Iteration 80, loss = 0.0129
--- Epoch 528 / 100000 - 2976 epochs total
Iteration 0, loss = 0.0548
Iteration 20, loss = 0.0080
Iteration 40, loss = 0.0069
Iteration 60, loss = 0.0051
Iteration 80, loss = 0.0080
--- Epoch 529 / 100000 - 2977 epochs total
Iteration 0, loss = 0.0022
Iteration 20, loss = 0.0272
Iteration 40, loss = 0.0123
Iteration 60, loss = 0.0058
Iteration 80, loss = 0.0209
--- Epoch 530 / 100000 - 2978 epochs total
Iteration 0, loss = 0.0159
Iteration 20, loss = 0.0309
Iteration 40, loss = 0.0103
Iteration 60, loss = 0.0080
Iteration 80, loss = 0.0108
--- Epoch 531 / 100000 - 2979 epochs total
Iteration 0, loss = 0.0084
Iteration 20, loss = 0.0087
Iteration 40, loss = 0.0048
Iteration 60, loss = 0.0090
Iteration 80, loss = 0.0040
--- Epoch 532 / 100000 - 2980 epochs total
Iteration 0, loss = 0.0294
Iteration 20, loss = 0.0029
Iteration 40, loss = 0.0046
Iteration 60, loss = 0.0064
Iteration 80, loss = 0.0061
--- Epoch 533 / 100000 - 2981 epochs total
Iteration 0, loss = 0.0037
Iteration 20, loss = 0.0061
Iteration 40, loss = 0.0028
Iteration 60, loss = 0.0027
Iteration 80, loss = 0.0290
--- Epoch 534 / 100000 - 2982 epochs total
Iteration 0, loss = 0.0671
Iteration 20, loss = 0.0039
Iteration 40, loss = 0.0367
Iteration 60, loss = 0.0073
Iteration 80, loss = 0.0180
--- Epoch 535 / 100000 - 2983 epochs total
Iteration 0, loss = 0.0110
Iteration 20, loss = 0.0010
Iteration 40, loss = 0.0034
Iteration 60, loss = 0.0306
Iteration 80, loss = 0.0119
--- Epoch 536 / 100000 - 2984 epochs total
Iteration 0, loss = 0.0165
Iteration 20, loss = 0.0097
Iteration 40, loss = 0.0103
Iteration 60, loss = 0.0067
Iteration 80, loss = 0.0032
--- Epoch 537 / 100000 - 2985 epochs total
Iteration 0, loss = 0.0121
Iteration 20, loss = 0.0106
Iteration 40, loss = 0.0185
Iteration 60, loss = 0.0121
Iteration 80, loss = 0.0037
--- Epoch 538 / 100000 - 2986 epochs total
Iteration 0, loss = 0.0030
Iteration 20, loss = 0.0247
Iteration 40, loss = 0.0030
Iteration 60, loss = 0.0088
Iteration 80, loss = 0.0054
--- Epoch 539 / 100000 - 2987 epochs total
Iteration 0, loss = 0.0032
Iteration 20, loss = 0.0105
Iteration 40, loss = 0.0280
Iteration 60, loss = 0.0047
Iteration 80, loss = 0.0137
--- Epoch 540 / 100000 - 2988 epochs total
Iteration 0, loss = 0.0065
Iteration 20, loss = 0.0197
Iteration 40, loss = 0.0027
Iteration 60, loss = 0.0042
Iteration 80, loss = 0.0040
--- Epoch 541 / 100000 - 2989 epochs total
Iteration 0, loss = 0.0046
Iteration 20, loss = 0.0174
Iteration 40, loss = 0.0173
Iteration 60, loss = 0.0092
Iteration 80, loss = 0.0049
--- Epoch 542 / 100000 - 2990 epochs total
Iteration 0, loss = 0.0052
Iteration 20, loss = 0.0083
Iteration 40, loss = 0.0049
Iteration 60, loss = 0.0346
Iteration 80, loss = 0.0028
--- Epoch 543 / 100000 - 2991 epochs total
Iteration 0, loss = 0.0045
Iteration 20, loss = 0.0121
Iteration 40, loss = 0.0049
Iteration 60, loss = 0.0035
Iteration 80, loss = 0.0024
--- Epoch 544 / 100000 - 2992 epochs total
Iteration 0, loss = 0.0401
Iteration 20, loss = 0.0229
Iteration 40, loss = 0.0464
Iteration 60, loss = 0.0088
Iteration 80, loss = 0.0024
--- Epoch 545 / 100000 - 2993 epochs total
Iteration 0, loss = 0.0025
Iteration 20, loss = 0.0105
Iteration 40, loss = 0.0396
Iteration 60, loss = 0.0048
Iteration 80, loss = 0.0084
--- Epoch 546 / 100000 - 2994 epochs total
Iteration 0, loss = 0.0072
Iteration 20, loss = 0.0119
Iteration 40, loss = 0.0022
Iteration 60, loss = 0.0340
Iteration 80, loss = 0.0076
--- Epoch 547 / 100000 - 2995 epochs total
Iteration 0, loss = 0.0021
Iteration 20, loss = 0.0146
Iteration 40, loss = 0.0070
Iteration 60, loss = 0.0039
Iteration 80, loss = 0.0065
--- Epoch 548 / 100000 - 2996 epochs total
Iteration 0, loss = 0.0012
Iteration 20, loss = 0.0180
Iteration 40, loss = 0.0250
Iteration 60, loss = 0.0058
Iteration 80, loss = 0.0014
--- Epoch 549 / 100000 - 2997 epochs total
Iteration 0, loss = 0.0245
Iteration 20, loss = 0.0153
Iteration 40, loss = 0.0047
Iteration 60, loss = 0.0161
Iteration 80, loss = 0.0047
--- Epoch 550 / 100000 - 2998 epochs total
Iteration 0, loss = 0.0017
Iteration 20, loss = 0.0046
Iteration 40, loss = 0.0047
Iteration 60, loss = 0.0024
Iteration 80, loss = 0.0093
--- Epoch 551 / 100000 - 2999 epochs total
Iteration 0, loss = 0.0232
Iteration 20, loss = 0.0028
Iteration 40, loss = 0.0086
Iteration 60, loss = 0.0037
Iteration 80, loss = 0.0262
--- Epoch 552 / 100000 - 3000 epochs total
Iteration 0, loss = 0.0120
Iteration 20, loss = 0.0419
Iteration 40, loss = 0.0122
Iteration 60, loss = 0.0016
Iteration 80, loss = 0.0162
--- Epoch 553 / 100000 - 3001 epochs total
Iteration 0, loss = 0.0147
Iteration 20, loss = 0.0037
Iteration 40, loss = 0.0096
Iteration 60, loss = 0.0124
Iteration 80, loss = 0.0102
--- Epoch 554 / 100000 - 3002 epochs total
Iteration 0, loss = 0.0062
Iteration 20, loss = 0.0186
Iteration 40, loss = 0.0035
Iteration 60, loss = 0.0281
Iteration 80, loss = 0.0221
--- Epoch 555 / 100000 - 3003 epochs total
Iteration 0, loss = 0.0179
Iteration 20, loss = 0.0018
Iteration 40, loss = 0.0331
Iteration 60, loss = 0.0050
Iteration 80, loss = 0.0025
--- Epoch 556 / 100000 - 3004 epochs total
Iteration 0, loss = 0.0104
Iteration 20, loss = 0.0021
Iteration 40, loss = 0.0197
Iteration 60, loss = 0.0225
Iteration 80, loss = 0.0034
--- Epoch 557 / 100000 - 3005 epochs total
Iteration 0, loss = 0.0115
Iteration 20, loss = 0.0016
Iteration 40, loss = 0.0115
Iteration 60, loss = 0.0016
Iteration 80, loss = 0.0035
--- Epoch 558 / 100000 - 3006 epochs total
Iteration 0, loss = 0.0066
Iteration 20, loss = 0.0186
Iteration 40, loss = 0.0025
Iteration 60, loss = 0.0024
Iteration 80, loss = 0.0023
--- Epoch 559 / 100000 - 3007 epochs total
Iteration 0, loss = 0.0014
Iteration 20, loss = 0.0173
Iteration 40, loss = 0.0103
Iteration 60, loss = 0.0069
Iteration 80, loss = 0.0067
--- Epoch 560 / 100000 - 3008 epochs total
Iteration 0, loss = 0.0038
Iteration 20, loss = 0.0083
Iteration 40, loss = 0.0052
Iteration 60, loss = 0.0155
Iteration 80, loss = 0.0077
--- Epoch 561 / 100000 - 3009 epochs total
Iteration 0, loss = 0.0198
Iteration 20, loss = 0.0261
Iteration 40, loss = 0.0141
Iteration 60, loss = 0.0031
Iteration 80, loss = 0.0020
--- Epoch 562 / 100000 - 3010 epochs total
Iteration 0, loss = 0.0054
Iteration 20, loss = 0.0019
Iteration 40, loss = 0.0048
Iteration 60, loss = 0.0057
Iteration 80, loss = 0.0114
--- Epoch 563 / 100000 - 3011 epochs total
Iteration 0, loss = 0.0027
Iteration 20, loss = 0.0058
Iteration 40, loss = 0.0039
Iteration 60, loss = 0.0089
Iteration 80, loss = 0.0062
--- Epoch 564 / 100000 - 3012 epochs total
Iteration 0, loss = 0.0234
Iteration 20, loss = 0.0306
Iteration 40, loss = 0.0025
Iteration 60, loss = 0.0083
Iteration 80, loss = 0.0166
--- Epoch 565 / 100000 - 3013 epochs total
Iteration 0, loss = 0.0021
Iteration 20, loss = 0.0068
Iteration 40, loss = 0.0033
Iteration 60, loss = 0.0032
Iteration 80, loss = 0.0076
--- Epoch 566 / 100000 - 3014 epochs total
Iteration 0, loss = 0.0076
Iteration 20, loss = 0.0199
Iteration 40, loss = 0.0051
Iteration 60, loss = 0.0035
Iteration 80, loss = 0.0107
--- Epoch 567 / 100000 - 3015 epochs total
Iteration 0, loss = 0.0268
Iteration 20, loss = 0.0247
Iteration 40, loss = 0.0285
Iteration 60, loss = 0.0038
Iteration 80, loss = 0.0045
--- Epoch 568 / 100000 - 3016 epochs total
Iteration 0, loss = 0.0022
Iteration 20, loss = 0.0031
Iteration 40, loss = 0.0013
Iteration 60, loss = 0.0160
Iteration 80, loss = 0.0245
--- Epoch 569 / 100000 - 3017 epochs total
Iteration 0, loss = 0.0093
Iteration 20, loss = 0.0093
Iteration 40, loss = 0.0161
Iteration 60, loss = 0.0045
Iteration 80, loss = 0.0254
--- Epoch 570 / 100000 - 3018 epochs total
Iteration 0, loss = 0.0030
Iteration 20, loss = 0.0020
Iteration 40, loss = 0.0063
Iteration 60, loss = 0.0029
Iteration 80, loss = 0.0036
--- Epoch 571 / 100000 - 3019 epochs total
Iteration 0, loss = 0.0030
Iteration 20, loss = 0.0080
Iteration 40, loss = 0.0038
Iteration 60, loss = 0.0030
Iteration 80, loss = 0.0016
--- Epoch 572 / 100000 - 3020 epochs total
Iteration 0, loss = 0.0101
Iteration 20, loss = 0.0111
Iteration 40, loss = 0.0046
Iteration 60, loss = 0.0102
Iteration 80, loss = 0.0156
--- Epoch 573 / 100000 - 3021 epochs total
Iteration 0, loss = 0.0040
Iteration 20, loss = 0.0081
Iteration 40, loss = 0.0274
Iteration 60, loss = 0.0228
Iteration 80, loss = 0.0013
--- Epoch 574 / 100000 - 3022 epochs total
Iteration 0, loss = 0.0037
Iteration 20, loss = 0.0027
Iteration 40, loss = 0.0181
Iteration 60, loss = 0.0069
Iteration 80, loss = 0.0048
--- Epoch 575 / 100000 - 3023 epochs total
Iteration 0, loss = 0.0124
Iteration 20, loss = 0.0027
Iteration 40, loss = 0.0186
Iteration 60, loss = 0.0022
Iteration 80, loss = 0.0022
--- Epoch 576 / 100000 - 3024 epochs total
Iteration 0, loss = 0.0191
Iteration 20, loss = 0.0013
Iteration 40, loss = 0.0112
Iteration 60, loss = 0.0034
Iteration 80, loss = 0.0090
--- Epoch 577 / 100000 - 3025 epochs total
Iteration 0, loss = 0.0091
Iteration 20, loss = 0.0089
Iteration 40, loss = 0.0073
Iteration 60, loss = 0.0028
Iteration 80, loss = 0.0012
--- Epoch 578 / 100000 - 3026 epochs total
Iteration 0, loss = 0.0028
Iteration 20, loss = 0.0073
Iteration 40, loss = 0.0024
Iteration 60, loss = 0.0014
Iteration 80, loss = 0.0214
--- Epoch 579 / 100000 - 3027 epochs total
Iteration 0, loss = 0.0156
Iteration 20, loss = 0.0091
Iteration 40, loss = 0.0031
Iteration 60, loss = 0.0094
Iteration 80, loss = 0.0345
--- Epoch 580 / 100000 - 3028 epochs total
Iteration 0, loss = 0.0290
Iteration 20, loss = 0.0102
Iteration 40, loss = 0.0041
Iteration 60, loss = 0.0180
Iteration 80, loss = 0.0287
--- Epoch 581 / 100000 - 3029 epochs total
Iteration 0, loss = 0.0029
Iteration 20, loss = 0.0023
Iteration 40, loss = 0.0063
Iteration 60, loss = 0.0170
Iteration 80, loss = 0.0088
--- Epoch 582 / 100000 - 3030 epochs total
Iteration 0, loss = 0.0077
Iteration 20, loss = 0.0067
Iteration 40, loss = 0.0083
Iteration 60, loss = 0.0041
Iteration 80, loss = 0.0016
--- Epoch 583 / 100000 - 3031 epochs total
Iteration 0, loss = 0.0053
Iteration 20, loss = 0.0026
Iteration 40, loss = 0.0016
Iteration 60, loss = 0.0038
Iteration 80, loss = 0.0098
--- Epoch 584 / 100000 - 3032 epochs total
Iteration 0, loss = 0.0151
Iteration 20, loss = 0.0205
Iteration 40, loss = 0.0038
Iteration 60, loss = 0.0130
Iteration 80, loss = 0.0038
--- Epoch 585 / 100000 - 3033 epochs total
Iteration 0, loss = 0.0067
Iteration 20, loss = 0.0031
Iteration 40, loss = 0.0304
Iteration 60, loss = 0.0119
Iteration 80, loss = 0.0374
--- Epoch 586 / 100000 - 3034 epochs total
Iteration 0, loss = 0.0077
Iteration 20, loss = 0.0188
Iteration 40, loss = 0.0041
Iteration 60, loss = 0.0041
Iteration 80, loss = 0.0388
--- Epoch 587 / 100000 - 3035 epochs total
Iteration 0, loss = 0.0069
Iteration 20, loss = 0.0108
Iteration 40, loss = 0.0035
Iteration 60, loss = 0.0058
Iteration 80, loss = 0.0028
--- Epoch 588 / 100000 - 3036 epochs total
Iteration 0, loss = 0.0067
Iteration 20, loss = 0.0158
Iteration 40, loss = 0.0020
Iteration 60, loss = 0.0053
Iteration 80, loss = 0.0020
--- Epoch 589 / 100000 - 3037 epochs total
Iteration 0, loss = 0.0040
Iteration 20, loss = 0.0152
Iteration 40, loss = 0.0037
Iteration 60, loss = 0.0040
Iteration 80, loss = 0.0021
--- Epoch 590 / 100000 - 3038 epochs total
Iteration 0, loss = 0.0147
Iteration 20, loss = 0.0046
Iteration 40, loss = 0.0108
Iteration 60, loss = 0.0208
Iteration 80, loss = 0.0101
--- Epoch 591 / 100000 - 3039 epochs total
Iteration 0, loss = 0.0665
Iteration 20, loss = 0.0105
Iteration 40, loss = 0.0150
Iteration 60, loss = 0.0046
Iteration 80, loss = 0.0120
--- Epoch 592 / 100000 - 3040 epochs total
Iteration 0, loss = 0.0193
Iteration 20, loss = 0.0083
Iteration 40, loss = 0.0035
Iteration 60, loss = 0.0021
Iteration 80, loss = 0.0111
--- Epoch 593 / 100000 - 3041 epochs total
Iteration 0, loss = 0.0292
Iteration 20, loss = 0.0414
Iteration 40, loss = 0.0063
Iteration 60, loss = 0.0021
Iteration 80, loss = 0.0182
--- Epoch 594 / 100000 - 3042 epochs total
Iteration 0, loss = 0.0056
Iteration 20, loss = 0.0166
Iteration 40, loss = 0.0070
Iteration 60, loss = 0.0074
Iteration 80, loss = 0.0032
--- Epoch 595 / 100000 - 3043 epochs total
Iteration 0, loss = 0.0021
Iteration 20, loss = 0.0023
Iteration 40, loss = 0.0127
Iteration 60, loss = 0.0068
Iteration 80, loss = 0.0026
--- Epoch 596 / 100000 - 3044 epochs total
Iteration 0, loss = 0.0047
Iteration 20, loss = 0.0361
Iteration 40, loss = 0.0038
Iteration 60, loss = 0.0075
Iteration 80, loss = 0.0056
--- Epoch 597 / 100000 - 3045 epochs total
Iteration 0, loss = 0.0061
Iteration 20, loss = 0.0038
Iteration 40, loss = 0.0075
Iteration 60, loss = 0.0106
Iteration 80, loss = 0.0056
--- Epoch 598 / 100000 - 3046 epochs total
Iteration 0, loss = 0.0011
Iteration 20, loss = 0.0030
Iteration 40, loss = 0.0084
Iteration 60, loss = 0.0130
Iteration 80, loss = 0.0070
--- Epoch 599 / 100000 - 3047 epochs total
Iteration 0, loss = 0.0042
Iteration 20, loss = 0.0265
Iteration 40, loss = 0.0240
Iteration 60, loss = 0.0074
Iteration 80, loss = 0.0114
--- Epoch 600 / 100000 - 3048 epochs total
Iteration 0, loss = 0.0039
Iteration 20, loss = 0.0032
Iteration 40, loss = 0.0027
Iteration 60, loss = 0.0020
Iteration 80, loss = 0.0037
--- Epoch 601 / 100000 - 3049 epochs total
Iteration 0, loss = 0.0081
Iteration 20, loss = 0.0455
Iteration 40, loss = 0.0124
Iteration 60, loss = 0.0156
Iteration 80, loss = 0.0194
--- Epoch 602 / 100000 - 3050 epochs total
Iteration 0, loss = 0.0168
Iteration 20, loss = 0.0171
Iteration 40, loss = 0.0058
Iteration 60, loss = 0.0056
Iteration 80, loss = 0.0161
--- Epoch 603 / 100000 - 3051 epochs total
Iteration 0, loss = 0.0027
Iteration 20, loss = 0.0011
Iteration 40, loss = 0.0298
Iteration 60, loss = 0.0108
Iteration 80, loss = 0.0075
--- Epoch 604 / 100000 - 3052 epochs total
Iteration 0, loss = 0.0049
Iteration 20, loss = 0.0074
Iteration 40, loss = 0.0176
Iteration 60, loss = 0.0053
Iteration 80, loss = 0.0023
--- Epoch 605 / 100000 - 3053 epochs total
Iteration 0, loss = 0.0020
Iteration 20, loss = 0.0022
Iteration 40, loss = 0.0102
Iteration 60, loss = 0.0094
Iteration 80, loss = 0.0034
--- Epoch 606 / 100000 - 3054 epochs total
Iteration 0, loss = 0.0146
Iteration 20, loss = 0.0063
Iteration 40, loss = 0.0069
Iteration 60, loss = 0.0067
Iteration 80, loss = 0.0071
--- Epoch 607 / 100000 - 3055 epochs total
Iteration 0, loss = 0.0015
Iteration 20, loss = 0.0049
Iteration 40, loss = 0.0149
Iteration 60, loss = 0.0069
Iteration 80, loss = 0.0118
--- Epoch 608 / 100000 - 3056 epochs total
Iteration 0, loss = 0.0154
Iteration 20, loss = 0.0043
Iteration 40, loss = 0.0045
Iteration 60, loss = 0.0123
Iteration 80, loss = 0.0028
--- Epoch 609 / 100000 - 3057 epochs total
Iteration 0, loss = 0.0008
Iteration 20, loss = 0.0147
Iteration 40, loss = 0.0019
Iteration 60, loss = 0.0047
Iteration 80, loss = 0.0068
--- Epoch 610 / 100000 - 3058 epochs total
Iteration 0, loss = 0.0032
Iteration 20, loss = 0.0009
Iteration 40, loss = 0.0041
Iteration 60, loss = 0.0051
Iteration 80, loss = 0.0222
--- Epoch 611 / 100000 - 3059 epochs total
Iteration 0, loss = 0.0034
Iteration 20, loss = 0.0029
Iteration 40, loss = 0.0053
Iteration 60, loss = 0.0135
Iteration 80, loss = 0.0168
--- Epoch 612 / 100000 - 3060 epochs total
Iteration 0, loss = 0.0070
Iteration 20, loss = 0.0018
Iteration 40, loss = 0.0053
Iteration 60, loss = 0.0383
Iteration 80, loss = 0.0036
--- Epoch 613 / 100000 - 3061 epochs total
Iteration 0, loss = 0.0153
Iteration 20, loss = 0.0064
Iteration 40, loss = 0.0068
Iteration 60, loss = 0.0018
Iteration 80, loss = 0.0056
--- Epoch 614 / 100000 - 3062 epochs total
Iteration 0, loss = 0.0133
Iteration 20, loss = 0.0152
Iteration 40, loss = 0.0005
Iteration 60, loss = 0.0207
Iteration 80, loss = 0.0099
--- Epoch 615 / 100000 - 3063 epochs total
Iteration 0, loss = 0.0179
Iteration 20, loss = 0.0099
Iteration 40, loss = 0.0299
Iteration 60, loss = 0.0069
Iteration 80, loss = 0.0097
--- Epoch 616 / 100000 - 3064 epochs total
Iteration 0, loss = 0.0033
Iteration 20, loss = 0.0019
Iteration 40, loss = 0.0085
Iteration 60, loss = 0.0050
Iteration 80, loss = 0.0046
--- Epoch 617 / 100000 - 3065 epochs total
Iteration 0, loss = 0.0074
Iteration 20, loss = 0.0099
Iteration 40, loss = 0.0125
Iteration 60, loss = 0.0058
Iteration 80, loss = 0.0088
--- Epoch 618 / 100000 - 3066 epochs total
Iteration 0, loss = 0.0416
Iteration 20, loss = 0.0044
Iteration 40, loss = 0.0077
Iteration 60, loss = 0.0318
Iteration 80, loss = 0.0135
--- Epoch 619 / 100000 - 3067 epochs total
Iteration 0, loss = 0.0106
Iteration 20, loss = 0.0094
Iteration 40, loss = 0.0035
Iteration 60, loss = 0.0118
Iteration 80, loss = 0.0047
--- Epoch 620 / 100000 - 3068 epochs total
Iteration 0, loss = 0.0067
Iteration 20, loss = 0.0120
Iteration 40, loss = 0.0211
Iteration 60, loss = 0.0417
Iteration 80, loss = 0.0112
--- Epoch 621 / 100000 - 3069 epochs total
Iteration 0, loss = 0.0203
Iteration 20, loss = 0.0229
Iteration 40, loss = 0.0068
Iteration 60, loss = 0.0028
Iteration 80, loss = 0.0069
--- Epoch 622 / 100000 - 3070 epochs total
Iteration 0, loss = 0.0177
Iteration 20, loss = 0.0056
Iteration 40, loss = 0.0250
Iteration 60, loss = 0.0056
Iteration 80, loss = 0.0050
--- Epoch 623 / 100000 - 3071 epochs total
Iteration 0, loss = 0.0062
Iteration 20, loss = 0.0090
Iteration 40, loss = 0.0021
Iteration 60, loss = 0.0047
Iteration 80, loss = 0.0089
--- Epoch 624 / 100000 - 3072 epochs total
Iteration 0, loss = 0.0078
Iteration 20, loss = 0.0210
Iteration 40, loss = 0.0290
Iteration 60, loss = 0.0049
Iteration 80, loss = 0.0021
--- Epoch 625 / 100000 - 3073 epochs total
Iteration 0, loss = 0.0125
Iteration 20, loss = 0.0038
Iteration 40, loss = 0.0052
Iteration 60, loss = 0.0078
Iteration 80, loss = 0.0044
--- Epoch 626 / 100000 - 3074 epochs total
Iteration 0, loss = 0.0109
Iteration 20, loss = 0.0070
Iteration 40, loss = 0.0058
Iteration 60, loss = 0.0029
Iteration 80, loss = 0.0065
--- Epoch 627 / 100000 - 3075 epochs total
Iteration 0, loss = 0.0095
Iteration 20, loss = 0.0050
Iteration 40, loss = 0.0484
Iteration 60, loss = 0.0031
Iteration 80, loss = 0.0109
--- Epoch 628 / 100000 - 3076 epochs total
Iteration 0, loss = 0.0180
Iteration 20, loss = 0.0101
Iteration 40, loss = 0.0104
Iteration 60, loss = 0.0084
Iteration 80, loss = 0.0019
--- Epoch 629 / 100000 - 3077 epochs total
Iteration 0, loss = 0.0045
Iteration 20, loss = 0.0202
Iteration 40, loss = 0.0067
Iteration 60, loss = 0.0117
Iteration 80, loss = 0.0041
--- Epoch 630 / 100000 - 3078 epochs total
Iteration 0, loss = 0.0167
Iteration 20, loss = 0.0022
Iteration 40, loss = 0.0037
Iteration 60, loss = 0.0151
Iteration 80, loss = 0.0074
--- Epoch 631 / 100000 - 3079 epochs total
Iteration 0, loss = 0.0168
Iteration 20, loss = 0.0049
Iteration 40, loss = 0.0295
Iteration 60, loss = 0.0202
Iteration 80, loss = 0.0041
--- Epoch 632 / 100000 - 3080 epochs total
Iteration 0, loss = 0.0057
Iteration 20, loss = 0.0158
Iteration 40, loss = 0.0027
Iteration 60, loss = 0.0166
Iteration 80, loss = 0.0191
--- Epoch 633 / 100000 - 3081 epochs total
Iteration 0, loss = 0.0097
Iteration 20, loss = 0.0130
Iteration 40, loss = 0.0016
Iteration 60, loss = 0.0128
Iteration 80, loss = 0.0052
--- Epoch 634 / 100000 - 3082 epochs total
Iteration 0, loss = 0.0019
Iteration 20, loss = 0.0202
Iteration 40, loss = 0.0023
Iteration 60, loss = 0.0054
Iteration 80, loss = 0.0023
--- Epoch 635 / 100000 - 3083 epochs total
Iteration 0, loss = 0.0043
Iteration 20, loss = 0.0034
Iteration 40, loss = 0.0023
Iteration 60, loss = 0.0317
Iteration 80, loss = 0.0035
--- Epoch 636 / 100000 - 3084 epochs total
Iteration 0, loss = 0.0030
Iteration 20, loss = 0.0156
Iteration 40, loss = 0.0107
Iteration 60, loss = 0.0072
Iteration 80, loss = 0.0023
--- Epoch 637 / 100000 - 3085 epochs total
Iteration 0, loss = 0.0138
Iteration 20, loss = 0.0068
Iteration 40, loss = 0.0290
Iteration 60, loss = 0.0105
Iteration 80, loss = 0.0044
--- Epoch 638 / 100000 - 3086 epochs total
Iteration 0, loss = 0.0026
Iteration 20, loss = 0.0077
Iteration 40, loss = 0.0080
Iteration 60, loss = 0.0071
Iteration 80, loss = 0.0082
--- Epoch 639 / 100000 - 3087 epochs total
Iteration 0, loss = 0.0301
Iteration 20, loss = 0.0077
Iteration 40, loss = 0.0204
Iteration 60, loss = 0.0236
Iteration 80, loss = 0.0009
--- Epoch 640 / 100000 - 3088 epochs total
Iteration 0, loss = 0.0041
Iteration 20, loss = 0.0037
Iteration 40, loss = 0.0280
Iteration 60, loss = 0.0070
Iteration 80, loss = 0.0070
--- Epoch 641 / 100000 - 3089 epochs total
Iteration 0, loss = 0.0031
Iteration 20, loss = 0.0019
Iteration 40, loss = 0.0022
Iteration 60, loss = 0.0083
Iteration 80, loss = 0.0061
--- Epoch 642 / 100000 - 3090 epochs total
Iteration 0, loss = 0.0170
Iteration 20, loss = 0.0040
Iteration 40, loss = 0.0073
Iteration 60, loss = 0.0179
Iteration 80, loss = 0.0037
--- Epoch 643 / 100000 - 3091 epochs total
Iteration 0, loss = 0.0076
Iteration 20, loss = 0.0146
Iteration 40, loss = 0.0168
Iteration 60, loss = 0.0062
Iteration 80, loss = 0.0064
--- Epoch 644 / 100000 - 3092 epochs total
Iteration 0, loss = 0.0109
Iteration 20, loss = 0.0016
Iteration 40, loss = 0.0025
Iteration 60, loss = 0.0211
Iteration 80, loss = 0.0029
--- Epoch 645 / 100000 - 3093 epochs total
Iteration 0, loss = 0.0115
Iteration 20, loss = 0.0061
Iteration 40, loss = 0.0052
Iteration 60, loss = 0.0045
Iteration 80, loss = 0.0257
--- Epoch 646 / 100000 - 3094 epochs total
Iteration 0, loss = 0.0166
Iteration 20, loss = 0.0063
Iteration 40, loss = 0.0229
Iteration 60, loss = 0.0093
Iteration 80, loss = 0.0045
--- Epoch 647 / 100000 - 3095 epochs total
Iteration 0, loss = 0.0034
Iteration 20, loss = 0.0328
Iteration 40, loss = 0.0053
Iteration 60, loss = 0.0135
Iteration 80, loss = 0.0089
--- Epoch 648 / 100000 - 3096 epochs total
Iteration 0, loss = 0.0027
Iteration 20, loss = 0.0125
Iteration 40, loss = 0.0112
Iteration 60, loss = 0.0070
Iteration 80, loss = 0.0018
--- Epoch 649 / 100000 - 3097 epochs total
Iteration 0, loss = 0.0279
Iteration 20, loss = 0.0037
Iteration 40, loss = 0.0054
Iteration 60, loss = 0.0027
Iteration 80, loss = 0.0031
--- Epoch 650 / 100000 - 3098 epochs total
Iteration 0, loss = 0.0105
Iteration 20, loss = 0.0075
Iteration 40, loss = 0.0140
Iteration 60, loss = 0.0073
Iteration 80, loss = 0.0177
--- Epoch 651 / 100000 - 3099 epochs total
Iteration 0, loss = 0.0031
Iteration 20, loss = 0.0072
Iteration 40, loss = 0.0034
Iteration 60, loss = 0.0058
Iteration 80, loss = 0.0035
--- Epoch 652 / 100000 - 3100 epochs total
Iteration 0, loss = 0.0198
Iteration 20, loss = 0.0083
Iteration 40, loss = 0.0015
Iteration 60, loss = 0.0268
Iteration 80, loss = 0.0046
--- Epoch 653 / 100000 - 3101 epochs total
Iteration 0, loss = 0.0090
Iteration 20, loss = 0.0113
Iteration 40, loss = 0.0208
Iteration 60, loss = 0.0158
Iteration 80, loss = 0.0047
--- Epoch 654 / 100000 - 3102 epochs total
Iteration 0, loss = 0.0060
Iteration 20, loss = 0.0063
Iteration 40, loss = 0.0162
Iteration 60, loss = 0.0090
Iteration 80, loss = 0.0092
--- Epoch 655 / 100000 - 3103 epochs total
Iteration 0, loss = 0.0199
Iteration 20, loss = 0.0071
Iteration 40, loss = 0.0200
Iteration 60, loss = 0.0073
Iteration 80, loss = 0.0677
--- Epoch 656 / 100000 - 3104 epochs total
Iteration 0, loss = 0.0049
Iteration 20, loss = 0.0528
Iteration 40, loss = 0.0041
Iteration 60, loss = 0.0029
Iteration 80, loss = 0.0031
--- Epoch 657 / 100000 - 3105 epochs total
Iteration 0, loss = 0.0039
Iteration 20, loss = 0.0098
Iteration 40, loss = 0.0211
Iteration 60, loss = 0.0085
Iteration 80, loss = 0.0108
--- Epoch 658 / 100000 - 3106 epochs total
Iteration 0, loss = 0.0214
Iteration 20, loss = 0.0166
Iteration 40, loss = 0.0052
Iteration 60, loss = 0.0038
Iteration 80, loss = 0.0040
--- Epoch 659 / 100000 - 3107 epochs total
Iteration 0, loss = 0.0243
Iteration 20, loss = 0.0166
Iteration 40, loss = 0.0039
Iteration 60, loss = 0.0011
Iteration 80, loss = 0.0114
--- Epoch 660 / 100000 - 3108 epochs total
Iteration 0, loss = 0.0300
Iteration 20, loss = 0.0082
Iteration 40, loss = 0.0063
Iteration 60, loss = 0.0058
Iteration 80, loss = 0.0070
--- Epoch 661 / 100000 - 3109 epochs total
Iteration 0, loss = 0.0019
Iteration 20, loss = 0.0063
Iteration 40, loss = 0.0041
Iteration 60, loss = 0.0105
Iteration 80, loss = 0.0130
--- Epoch 662 / 100000 - 3110 epochs total
Iteration 0, loss = 0.0119
Iteration 20, loss = 0.0069
Iteration 40, loss = 0.0069
Iteration 60, loss = 0.0060
Iteration 80, loss = 0.0140
--- Epoch 663 / 100000 - 3111 epochs total
Iteration 0, loss = 0.0118
Iteration 20, loss = 0.0061
Iteration 40, loss = 0.0159
Iteration 60, loss = 0.0130
Iteration 80, loss = 0.0626
--- Epoch 664 / 100000 - 3112 epochs total
Iteration 0, loss = 0.0089
Iteration 20, loss = 0.0080
Iteration 40, loss = 0.0023
Iteration 60, loss = 0.0265
Iteration 80, loss = 0.0130
--- Epoch 665 / 100000 - 3113 epochs total
Iteration 0, loss = 0.0091
Iteration 20, loss = 0.0050
Iteration 40, loss = 0.0238
Iteration 60, loss = 0.0261
Iteration 80, loss = 0.0047
--- Epoch 666 / 100000 - 3114 epochs total
Iteration 0, loss = 0.0065
Iteration 20, loss = 0.0042
Iteration 40, loss = 0.0303
Iteration 60, loss = 0.0108
Iteration 80, loss = 0.0022
--- Epoch 667 / 100000 - 3115 epochs total
Iteration 0, loss = 0.0052
Iteration 20, loss = 0.0025
Iteration 40, loss = 0.0143
Iteration 60, loss = 0.0060
Iteration 80, loss = 0.0031
--- Epoch 668 / 100000 - 3116 epochs total
Iteration 0, loss = 0.0016
Iteration 20, loss = 0.0008
Iteration 40, loss = 0.0055
Iteration 60, loss = 0.0056
Iteration 80, loss = 0.0305
--- Epoch 669 / 100000 - 3117 epochs total
Iteration 0, loss = 0.0064
Iteration 20, loss = 0.0592
Iteration 40, loss = 0.0033
Iteration 60, loss = 0.0045
Iteration 80, loss = 0.0096
--- Epoch 670 / 100000 - 3118 epochs total
Iteration 0, loss = 0.0053
Iteration 20, loss = 0.0051
Iteration 40, loss = 0.0146
Iteration 60, loss = 0.0085
Iteration 80, loss = 0.0418
--- Epoch 671 / 100000 - 3119 epochs total
Iteration 0, loss = 0.0106
Iteration 20, loss = 0.0068
Iteration 40, loss = 0.0051
Iteration 60, loss = 0.0170
Iteration 80, loss = 0.0064
--- Epoch 672 / 100000 - 3120 epochs total
Iteration 0, loss = 0.0029
Iteration 20, loss = 0.0077
Iteration 40, loss = 0.0845
Iteration 60, loss = 0.0062
Iteration 80, loss = 0.0101
--- Epoch 673 / 100000 - 3121 epochs total
Iteration 0, loss = 0.0222
Iteration 20, loss = 0.0150
Iteration 40, loss = 0.0177
Iteration 60, loss = 0.0029
Iteration 80, loss = 0.0050
--- Epoch 674 / 100000 - 3122 epochs total
Iteration 0, loss = 0.0021
Iteration 20, loss = 0.0086
Iteration 40, loss = 0.0038
Iteration 60, loss = 0.0012
Iteration 80, loss = 0.0015
--- Epoch 675 / 100000 - 3123 epochs total
Iteration 0, loss = 0.0020
Iteration 20, loss = 0.0116
Iteration 40, loss = 0.0039
Iteration 60, loss = 0.0071
Iteration 80, loss = 0.0392
--- Epoch 676 / 100000 - 3124 epochs total
Iteration 0, loss = 0.0161
Iteration 20, loss = 0.0091
Iteration 40, loss = 0.0954
Iteration 60, loss = 0.0018
Iteration 80, loss = 0.0109
--- Epoch 677 / 100000 - 3125 epochs total
Iteration 0, loss = 0.0019
Iteration 20, loss = 0.0024
Iteration 40, loss = 0.0045
Iteration 60, loss = 0.0093
Iteration 80, loss = 0.0070
--- Epoch 678 / 100000 - 3126 epochs total
Iteration 0, loss = 0.0023
Iteration 20, loss = 0.0022
Iteration 40, loss = 0.0059
Iteration 60, loss = 0.0040
Iteration 80, loss = 0.0053
--- Epoch 679 / 100000 - 3127 epochs total
Iteration 0, loss = 0.0035
Iteration 20, loss = 0.0040
Iteration 40, loss = 0.0061
Iteration 60, loss = 0.0160
Iteration 80, loss = 0.0053
--- Epoch 680 / 100000 - 3128 epochs total
Iteration 0, loss = 0.0010
Iteration 20, loss = 0.0044
Iteration 40, loss = 0.0263
Iteration 60, loss = 0.0016
Iteration 80, loss = 0.0039
--- Epoch 681 / 100000 - 3129 epochs total
Iteration 0, loss = 0.0038
Iteration 20, loss = 0.0028
Iteration 40, loss = 0.0036
Iteration 60, loss = 0.0180
Iteration 80, loss = 0.0043
--- Epoch 682 / 100000 - 3130 epochs total
Iteration 0, loss = 0.0322
Iteration 20, loss = 0.0291
Iteration 40, loss = 0.0098
Iteration 60, loss = 0.0127
Iteration 80, loss = 0.0058
--- Epoch 683 / 100000 - 3131 epochs total
Iteration 0, loss = 0.0233
Iteration 20, loss = 0.0053
Iteration 40, loss = 0.0113
Iteration 60, loss = 0.0340
Iteration 80, loss = 0.0078
--- Epoch 684 / 100000 - 3132 epochs total
Iteration 0, loss = 0.0030
Iteration 20, loss = 0.0048
Iteration 40, loss = 0.0126
Iteration 60, loss = 0.0069
Iteration 80, loss = 0.0111
--- Epoch 685 / 100000 - 3133 epochs total
Iteration 0, loss = 0.0113
Iteration 20, loss = 0.0033
Iteration 40, loss = 0.0177
Iteration 60, loss = 0.0030
Iteration 80, loss = 0.0094
--- Epoch 686 / 100000 - 3134 epochs total
Iteration 0, loss = 0.0118
Iteration 20, loss = 0.0057
Iteration 40, loss = 0.0179
Iteration 60, loss = 0.0084
Iteration 80, loss = 0.0035
--- Epoch 687 / 100000 - 3135 epochs total
Iteration 0, loss = 0.0107
Iteration 20, loss = 0.0032
Iteration 40, loss = 0.0045
Iteration 60, loss = 0.0168
Iteration 80, loss = 0.0030
--- Epoch 688 / 100000 - 3136 epochs total
Iteration 0, loss = 0.0059
Iteration 20, loss = 0.0023
Iteration 40, loss = 0.0161
Iteration 60, loss = 0.0061
Iteration 80, loss = 0.0090
--- Epoch 689 / 100000 - 3137 epochs total
Iteration 0, loss = 0.0594
Iteration 20, loss = 0.0210
Iteration 40, loss = 0.0054
Iteration 60, loss = 0.0083
Iteration 80, loss = 0.0013
--- Epoch 690 / 100000 - 3138 epochs total
Iteration 0, loss = 0.0094
Iteration 20, loss = 0.0101
Iteration 40, loss = 0.0084
Iteration 60, loss = 0.0169
Iteration 80, loss = 0.0016
--- Epoch 691 / 100000 - 3139 epochs total
Iteration 0, loss = 0.0011
Iteration 20, loss = 0.0078
Iteration 40, loss = 0.0053
Iteration 60, loss = 0.0416
Iteration 80, loss = 0.0084
--- Epoch 692 / 100000 - 3140 epochs total
Iteration 0, loss = 0.0014
Iteration 20, loss = 0.0084
Iteration 40, loss = 0.0419
Iteration 60, loss = 0.0014
Iteration 80, loss = 0.0056
--- Epoch 693 / 100000 - 3141 epochs total
Iteration 0, loss = 0.0038
Iteration 20, loss = 0.0136
Iteration 40, loss = 0.0040
Iteration 60, loss = 0.0018
Iteration 80, loss = 0.0062
--- Epoch 694 / 100000 - 3142 epochs total
Iteration 0, loss = 0.0133
Iteration 20, loss = 0.0051
Iteration 40, loss = 0.0340
Iteration 60, loss = 0.0058
Iteration 80, loss = 0.0018
--- Epoch 695 / 100000 - 3143 epochs total
Iteration 0, loss = 0.0052
Iteration 20, loss = 0.0066
Iteration 40, loss = 0.0052
Iteration 60, loss = 0.0091
Iteration 80, loss = 0.0038
--- Epoch 696 / 100000 - 3144 epochs total
Iteration 0, loss = 0.0018
Iteration 20, loss = 0.0035
Iteration 40, loss = 0.0045
Iteration 60, loss = 0.0136
Iteration 80, loss = 0.0090
--- Epoch 697 / 100000 - 3145 epochs total
Iteration 0, loss = 0.0041
Iteration 20, loss = 0.0021
Iteration 40, loss = 0.0153
Iteration 60, loss = 0.0078
Iteration 80, loss = 0.0096
--- Epoch 698 / 100000 - 3146 epochs total
Iteration 0, loss = 0.0082
Iteration 20, loss = 0.0154
Iteration 40, loss = 0.0030
Iteration 60, loss = 0.0239
Iteration 80, loss = 0.0087
--- Epoch 699 / 100000 - 3147 epochs total
Iteration 0, loss = 0.0063
Iteration 20, loss = 0.0195
Iteration 40, loss = 0.0064
Iteration 60, loss = 0.0020
Iteration 80, loss = 0.0008
--- Epoch 700 / 100000 - 3148 epochs total
Iteration 0, loss = 0.0025
Iteration 20, loss = 0.0117
Iteration 40, loss = 0.0170
Iteration 60, loss = 0.0229
Iteration 80, loss = 0.0188
--- Epoch 701 / 100000 - 3149 epochs total
Iteration 0, loss = 0.0111
Iteration 20, loss = 0.0038
Iteration 40, loss = 0.0052
Iteration 60, loss = 0.0419
Iteration 80, loss = 0.0132
--- Epoch 702 / 100000 - 3150 epochs total
Iteration 0, loss = 0.0221
Iteration 20, loss = 0.0199
Iteration 40, loss = 0.0022
Iteration 60, loss = 0.0057
Iteration 80, loss = 0.0115
--- Epoch 703 / 100000 - 3151 epochs total
Iteration 0, loss = 0.0054
Iteration 20, loss = 0.0217
Iteration 40, loss = 0.0062
Iteration 60, loss = 0.0020
Iteration 80, loss = 0.0073
--- Epoch 704 / 100000 - 3152 epochs total
Iteration 0, loss = 0.0078
Iteration 20, loss = 0.0009
Iteration 40, loss = 0.0035
Iteration 60, loss = 0.0109
Iteration 80, loss = 0.0139
--- Epoch 705 / 100000 - 3153 epochs total
Iteration 0, loss = 0.0067
Iteration 20, loss = 0.0058
Iteration 40, loss = 0.0087
Iteration 60, loss = 0.0070
Iteration 80, loss = 0.0143
--- Epoch 706 / 100000 - 3154 epochs total
Iteration 0, loss = 0.0437
Iteration 20, loss = 0.0064
Iteration 40, loss = 0.0079
Iteration 60, loss = 0.0033
Iteration 80, loss = 0.0039
--- Epoch 707 / 100000 - 3155 epochs total
Iteration 0, loss = 0.0025
Iteration 20, loss = 0.0085
Iteration 40, loss = 0.0044
Iteration 60, loss = 0.0057
Iteration 80, loss = 0.0173
--- Epoch 708 / 100000 - 3156 epochs total
Iteration 0, loss = 0.0063
Iteration 20, loss = 0.0145
Iteration 40, loss = 0.0117
Iteration 60, loss = 0.0153
Iteration 80, loss = 0.0134
--- Epoch 709 / 100000 - 3157 epochs total
Iteration 0, loss = 0.0114
Iteration 20, loss = 0.0245
Iteration 40, loss = 0.0061
Iteration 60, loss = 0.0085
Iteration 80, loss = 0.0164
--- Epoch 710 / 100000 - 3158 epochs total
Iteration 0, loss = 0.0057
Iteration 20, loss = 0.0239
Iteration 40, loss = 0.0030
Iteration 60, loss = 0.0056
Iteration 80, loss = 0.0027
--- Epoch 711 / 100000 - 3159 epochs total
Iteration 0, loss = 0.0220
Iteration 20, loss = 0.0134
Iteration 40, loss = 0.0049
Iteration 60, loss = 0.0149
Iteration 80, loss = 0.0021
--- Epoch 712 / 100000 - 3160 epochs total
Iteration 0, loss = 0.0256
Iteration 20, loss = 0.0101
Iteration 40, loss = 0.0064
Iteration 60, loss = 0.0113
Iteration 80, loss = 0.0068
--- Epoch 713 / 100000 - 3161 epochs total
Iteration 0, loss = 0.0093
Iteration 20, loss = 0.0150
Iteration 40, loss = 0.0150
Iteration 60, loss = 0.0090
Iteration 80, loss = 0.0610
--- Epoch 714 / 100000 - 3162 epochs total
Iteration 0, loss = 0.0100
Iteration 20, loss = 0.0036
Iteration 40, loss = 0.0082
Iteration 60, loss = 0.0137
Iteration 80, loss = 0.0086
--- Epoch 715 / 100000 - 3163 epochs total
Iteration 0, loss = 0.0074
Iteration 20, loss = 0.0075
Iteration 40, loss = 0.0034
Iteration 60, loss = 0.0182
Iteration 80, loss = 0.0068
--- Epoch 716 / 100000 - 3164 epochs total
Iteration 0, loss = 0.0111
Iteration 20, loss = 0.0057
Iteration 40, loss = 0.0132
Iteration 60, loss = 0.0185
Iteration 80, loss = 0.0039
--- Epoch 717 / 100000 - 3165 epochs total
Iteration 0, loss = 0.0103
Iteration 20, loss = 0.0043
Iteration 40, loss = 0.0200
Iteration 60, loss = 0.0077
Iteration 80, loss = 0.0121
--- Epoch 718 / 100000 - 3166 epochs total
Iteration 0, loss = 0.0107
Iteration 20, loss = 0.0131
Iteration 40, loss = 0.0196
Iteration 60, loss = 0.0060
Iteration 80, loss = 0.0017
--- Epoch 719 / 100000 - 3167 epochs total
Iteration 0, loss = 0.0099
Iteration 20, loss = 0.0020
Iteration 40, loss = 0.0078
Iteration 60, loss = 0.0045
Iteration 80, loss = 0.0059
--- Epoch 720 / 100000 - 3168 epochs total
Iteration 0, loss = 0.0624
Iteration 20, loss = 0.0036
Iteration 40, loss = 0.0066
Iteration 60, loss = 0.0058
Iteration 80, loss = 0.0071
--- Epoch 721 / 100000 - 3169 epochs total
Iteration 0, loss = 0.0064
Iteration 20, loss = 0.0314
Iteration 40, loss = 0.0042
Iteration 60, loss = 0.0021
Iteration 80, loss = 0.0347
--- Epoch 722 / 100000 - 3170 epochs total
Iteration 0, loss = 0.0101
Iteration 20, loss = 0.0060
Iteration 40, loss = 0.0143
Iteration 60, loss = 0.0152
Iteration 80, loss = 0.0017
--- Epoch 723 / 100000 - 3171 epochs total
Iteration 0, loss = 0.0146
Iteration 20, loss = 0.0101
Iteration 40, loss = 0.0077
Iteration 60, loss = 0.0046
Iteration 80, loss = 0.0201
--- Epoch 724 / 100000 - 3172 epochs total
Iteration 0, loss = 0.0092
Iteration 20, loss = 0.0041
Iteration 40, loss = 0.0063
Iteration 60, loss = 0.0081
Iteration 80, loss = 0.0090
--- Epoch 725 / 100000 - 3173 epochs total
Iteration 0, loss = 0.0132
Iteration 20, loss = 0.0204
Iteration 40, loss = 0.0012
Iteration 60, loss = 0.0016
Iteration 80, loss = 0.0114
--- Epoch 726 / 100000 - 3174 epochs total
Iteration 0, loss = 0.0030
Iteration 20, loss = 0.0104
Iteration 40, loss = 0.0052
Iteration 60, loss = 0.0072
Iteration 80, loss = 0.0087
--- Epoch 727 / 100000 - 3175 epochs total
Iteration 0, loss = 0.0186
Iteration 20, loss = 0.0040
Iteration 40, loss = 0.0204
Iteration 60, loss = 0.0106
Iteration 80, loss = 0.0078
--- Epoch 728 / 100000 - 3176 epochs total
Iteration 0, loss = 0.0214
Iteration 20, loss = 0.0050
Iteration 40, loss = 0.0077
Iteration 60, loss = 0.0082
Iteration 80, loss = 0.0090
--- Epoch 729 / 100000 - 3177 epochs total
Iteration 0, loss = 0.0086
Iteration 20, loss = 0.0106
Iteration 40, loss = 0.0185
Iteration 60, loss = 0.0062
Iteration 80, loss = 0.0192
--- Epoch 730 / 100000 - 3178 epochs total
Iteration 0, loss = 0.0081
Iteration 20, loss = 0.0037
Iteration 40, loss = 0.0076
Iteration 60, loss = 0.0161
Iteration 80, loss = 0.0457
--- Epoch 731 / 100000 - 3179 epochs total
Iteration 0, loss = 0.0044
Iteration 20, loss = 0.0013
Iteration 40, loss = 0.0036
Iteration 60, loss = 0.0152
Iteration 80, loss = 0.0482
--- Epoch 732 / 100000 - 3180 epochs total
Iteration 0, loss = 0.0095
Iteration 20, loss = 0.0053
Iteration 40, loss = 0.0034
Iteration 60, loss = 0.0103
Iteration 80, loss = 0.0024
--- Epoch 733 / 100000 - 3181 epochs total
Iteration 0, loss = 0.0023
Iteration 20, loss = 0.0174
Iteration 40, loss = 0.0051
Iteration 60, loss = 0.0044
Iteration 80, loss = 0.0121
--- Epoch 734 / 100000 - 3182 epochs total
Iteration 0, loss = 0.0045
Iteration 20, loss = 0.0052
Iteration 40, loss = 0.0012
Iteration 60, loss = 0.0069
Iteration 80, loss = 0.0049
--- Epoch 735 / 100000 - 3183 epochs total
Iteration 0, loss = 0.0340
Iteration 20, loss = 0.0053
Iteration 40, loss = 0.0083
Iteration 60, loss = 0.0174
Iteration 80, loss = 0.0023
--- Epoch 736 / 100000 - 3184 epochs total
Iteration 0, loss = 0.0028
Iteration 20, loss = 0.0256
Iteration 40, loss = 0.0099
Iteration 60, loss = 0.0049
Iteration 80, loss = 0.0025
--- Epoch 737 / 100000 - 3185 epochs total
Iteration 0, loss = 0.0372
Iteration 20, loss = 0.0137
Iteration 40, loss = 0.0152
Iteration 60, loss = 0.0150
Iteration 80, loss = 0.0051
--- Epoch 738 / 100000 - 3186 epochs total
Iteration 0, loss = 0.0178
Iteration 20, loss = 0.0038
Iteration 40, loss = 0.0051
Iteration 60, loss = 0.0028
Iteration 80, loss = 0.0040
--- Epoch 739 / 100000 - 3187 epochs total
Iteration 0, loss = 0.0494
Iteration 20, loss = 0.0028
Iteration 40, loss = 0.0037
Iteration 60, loss = 0.0240
Iteration 80, loss = 0.0037
--- Epoch 740 / 100000 - 3188 epochs total
Iteration 0, loss = 0.0086
Iteration 20, loss = 0.0046
Iteration 40, loss = 0.0027
Iteration 60, loss = 0.0086
Iteration 80, loss = 0.0021
--- Epoch 741 / 100000 - 3189 epochs total
Iteration 0, loss = 0.0265
Iteration 20, loss = 0.0017
Iteration 40, loss = 0.0098
Iteration 60, loss = 0.0015
Iteration 80, loss = 0.0087
--- Epoch 742 / 100000 - 3190 epochs total
Iteration 0, loss = 0.0028
Iteration 20, loss = 0.0087
Iteration 40, loss = 0.0010
Iteration 60, loss = 0.0078
Iteration 80, loss = 0.0113
--- Epoch 743 / 100000 - 3191 epochs total
Iteration 0, loss = 0.0020
Iteration 20, loss = 0.0069
Iteration 40, loss = 0.0082
Iteration 60, loss = 0.0025
Iteration 80, loss = 0.0045
--- Epoch 744 / 100000 - 3192 epochs total
Iteration 0, loss = 0.0123
Iteration 20, loss = 0.0103
Iteration 40, loss = 0.0043
Iteration 60, loss = 0.0073
Iteration 80, loss = 0.0166
--- Epoch 745 / 100000 - 3193 epochs total
Iteration 0, loss = 0.0024
Iteration 20, loss = 0.0186
Iteration 40, loss = 0.0080
Iteration 60, loss = 0.0081
Iteration 80, loss = 0.0130
--- Epoch 746 / 100000 - 3194 epochs total
Iteration 0, loss = 0.0088
Iteration 20, loss = 0.0044
Iteration 40, loss = 0.0029
Iteration 60, loss = 0.0047
Iteration 80, loss = 0.0031
--- Epoch 747 / 100000 - 3195 epochs total
Iteration 0, loss = 0.0012
Iteration 20, loss = 0.0109
Iteration 40, loss = 0.0246
Iteration 60, loss = 0.0271
Iteration 80, loss = 0.0047
--- Epoch 748 / 100000 - 3196 epochs total
Iteration 0, loss = 0.0021
Iteration 20, loss = 0.0089
Iteration 40, loss = 0.0076
Iteration 60, loss = 0.0064
Iteration 80, loss = 0.0019
--- Epoch 749 / 100000 - 3197 epochs total
Iteration 0, loss = 0.0039
Iteration 20, loss = 0.0023
Iteration 40, loss = 0.0028
Iteration 60, loss = 0.0073
Iteration 80, loss = 0.0351
--- Epoch 750 / 100000 - 3198 epochs total
Iteration 0, loss = 0.0296
Iteration 20, loss = 0.0365
Iteration 40, loss = 0.0226
Iteration 60, loss = 0.0034
Iteration 80, loss = 0.0044
--- Epoch 751 / 100000 - 3199 epochs total
Iteration 0, loss = 0.0075
Iteration 20, loss = 0.0125
Iteration 40, loss = 0.0078
Iteration 60, loss = 0.0084
Iteration 80, loss = 0.0119
--- Epoch 752 / 100000 - 3200 epochs total
Iteration 0, loss = 0.0055
Iteration 20, loss = 0.0023
Iteration 40, loss = 0.0081
Iteration 60, loss = 0.0127
Iteration 80, loss = 0.0024
--- Epoch 753 / 100000 - 3201 epochs total
Iteration 0, loss = 0.0197
Iteration 20, loss = 0.0225
Iteration 40, loss = 0.0135
Iteration 60, loss = 0.0197
Iteration 80, loss = 0.0064
--- Epoch 754 / 100000 - 3202 epochs total
Iteration 0, loss = 0.0108
Iteration 20, loss = 0.0063
Iteration 40, loss = 0.0068
Iteration 60, loss = 0.0031
Iteration 80, loss = 0.0090
--- Epoch 755 / 100000 - 3203 epochs total
Iteration 0, loss = 0.0033
Iteration 20, loss = 0.0077
Iteration 40, loss = 0.0231
Iteration 60, loss = 0.0062
Iteration 80, loss = 0.0026
--- Epoch 756 / 100000 - 3204 epochs total
Iteration 0, loss = 0.0011
Iteration 20, loss = 0.0116
Iteration 40, loss = 0.0101
Iteration 60, loss = 0.0046
Iteration 80, loss = 0.0013
--- Epoch 757 / 100000 - 3205 epochs total
Iteration 0, loss = 0.0111
Iteration 20, loss = 0.0267
Iteration 40, loss = 0.0073
Iteration 60, loss = 0.0026
Iteration 80, loss = 0.0079
--- Epoch 758 / 100000 - 3206 epochs total
Iteration 0, loss = 0.0047
Iteration 20, loss = 0.0100
Iteration 40, loss = 0.0047
Iteration 60, loss = 0.0043
Iteration 80, loss = 0.0081
--- Epoch 759 / 100000 - 3207 epochs total
Iteration 0, loss = 0.0035
Iteration 20, loss = 0.0048
Iteration 40, loss = 0.0157
Iteration 60, loss = 0.0051
Iteration 80, loss = 0.0055
--- Epoch 760 / 100000 - 3208 epochs total
Iteration 0, loss = 0.0036
Iteration 20, loss = 0.0276
Iteration 40, loss = 0.0049
Iteration 60, loss = 0.0027
Iteration 80, loss = 0.0098
--- Epoch 761 / 100000 - 3209 epochs total
Iteration 0, loss = 0.0158
Iteration 20, loss = 0.0026
Iteration 40, loss = 0.0077
Iteration 60, loss = 0.0104
Iteration 80, loss = 0.0072
--- Epoch 762 / 100000 - 3210 epochs total
Iteration 0, loss = 0.0132
Iteration 20, loss = 0.0199
Iteration 40, loss = 0.0230
Iteration 60, loss = 0.0100
Iteration 80, loss = 0.0130
--- Epoch 763 / 100000 - 3211 epochs total
Iteration 0, loss = 0.0190
Iteration 20, loss = 0.0021
Iteration 40, loss = 0.0064
Iteration 60, loss = 0.0676
Iteration 80, loss = 0.0034
--- Epoch 764 / 100000 - 3212 epochs total
Iteration 0, loss = 0.0151
Iteration 20, loss = 0.0099
Iteration 40, loss = 0.0052
Iteration 60, loss = 0.0032
Iteration 80, loss = 0.0022
--- Epoch 765 / 100000 - 3213 epochs total
Iteration 0, loss = 0.0121
Iteration 20, loss = 0.0086
Iteration 40, loss = 0.0066
Iteration 60, loss = 0.0060
Iteration 80, loss = 0.0033
--- Epoch 766 / 100000 - 3214 epochs total
Iteration 0, loss = 0.0021
Iteration 20, loss = 0.0248
Iteration 40, loss = 0.0630
Iteration 60, loss = 0.0098
Iteration 80, loss = 0.0032
--- Epoch 767 / 100000 - 3215 epochs total
Iteration 0, loss = 0.0017
Iteration 20, loss = 0.0250
Iteration 40, loss = 0.0067
Iteration 60, loss = 0.0180
Iteration 80, loss = 0.0056
--- Epoch 768 / 100000 - 3216 epochs total
Iteration 0, loss = 0.0032
Iteration 20, loss = 0.0377
Iteration 40, loss = 0.0044
Iteration 60, loss = 0.0177
Iteration 80, loss = 0.0108
--- Epoch 769 / 100000 - 3217 epochs total
Iteration 0, loss = 0.0383
Iteration 20, loss = 0.0061
Iteration 40, loss = 0.0129
Iteration 60, loss = 0.0028
Iteration 80, loss = 0.0073
--- Epoch 770 / 100000 - 3218 epochs total
Iteration 0, loss = 0.0019
Iteration 20, loss = 0.0068
Iteration 40, loss = 0.0058
Iteration 60, loss = 0.0041
Iteration 80, loss = 0.0261
--- Epoch 771 / 100000 - 3219 epochs total
Iteration 0, loss = 0.0088
Iteration 20, loss = 0.0057
Iteration 40, loss = 0.0153
Iteration 60, loss = 0.0050
Iteration 80, loss = 0.0069
--- Epoch 772 / 100000 - 3220 epochs total
Iteration 0, loss = 0.0155
Iteration 20, loss = 0.0342
Iteration 40, loss = 0.0019
Iteration 60, loss = 0.0077
Iteration 80, loss = 0.0064
--- Epoch 773 / 100000 - 3221 epochs total
Iteration 0, loss = 0.0107
Iteration 20, loss = 0.0028
Iteration 40, loss = 0.0057
Iteration 60, loss = 0.0028
Iteration 80, loss = 0.0103
--- Epoch 774 / 100000 - 3222 epochs total
Iteration 0, loss = 0.0072
Iteration 20, loss = 0.0095
Iteration 40, loss = 0.0160
Iteration 60, loss = 0.0030
Iteration 80, loss = 0.0022
--- Epoch 775 / 100000 - 3223 epochs total
Iteration 0, loss = 0.0016
Iteration 20, loss = 0.0218
Iteration 40, loss = 0.0312
Iteration 60, loss = 0.0057
Iteration 80, loss = 0.0101
--- Epoch 776 / 100000 - 3224 epochs total
Iteration 0, loss = 0.0041
Iteration 20, loss = 0.0130
Iteration 40, loss = 0.0039
Iteration 60, loss = 0.0015
Iteration 80, loss = 0.0040
--- Epoch 777 / 100000 - 3225 epochs total
Iteration 0, loss = 0.0078
Iteration 20, loss = 0.0081
Iteration 40, loss = 0.0160
Iteration 60, loss = 0.0051
Iteration 80, loss = 0.0084
--- Epoch 778 / 100000 - 3226 epochs total
Iteration 0, loss = 0.0030
Iteration 20, loss = 0.0013
Iteration 40, loss = 0.0092
Iteration 60, loss = 0.0150
Iteration 80, loss = 0.0026
--- Epoch 779 / 100000 - 3227 epochs total
Iteration 0, loss = 0.0054
Iteration 20, loss = 0.0021
Iteration 40, loss = 0.0137
Iteration 60, loss = 0.0129
Iteration 80, loss = 0.0032
--- Epoch 780 / 100000 - 3228 epochs total
Iteration 0, loss = 0.0042
Iteration 20, loss = 0.0081
Iteration 40, loss = 0.0031
Iteration 60, loss = 0.0139
Iteration 80, loss = 0.0025
--- Epoch 781 / 100000 - 3229 epochs total
Iteration 0, loss = 0.0111
Iteration 20, loss = 0.0017
Iteration 40, loss = 0.0200
Iteration 60, loss = 0.0202
Iteration 80, loss = 0.0018
--- Epoch 782 / 100000 - 3230 epochs total
Iteration 0, loss = 0.0089
Iteration 20, loss = 0.0165
Iteration 40, loss = 0.0072
Iteration 60, loss = 0.0195
Iteration 80, loss = 0.0093
--- Epoch 783 / 100000 - 3231 epochs total
Iteration 0, loss = 0.0066
Iteration 20, loss = 0.0038
Iteration 40, loss = 0.0091
Iteration 60, loss = 0.0058
Iteration 80, loss = 0.0084
--- Epoch 784 / 100000 - 3232 epochs total
Iteration 0, loss = 0.0045
Iteration 20, loss = 0.0037
Iteration 40, loss = 0.0128
Iteration 60, loss = 0.0109
Iteration 80, loss = 0.0026
--- Epoch 785 / 100000 - 3233 epochs total
Iteration 0, loss = 0.0019
Iteration 20, loss = 0.0014
Iteration 40, loss = 0.0012
Iteration 60, loss = 0.0023
Iteration 80, loss = 0.0177
--- Epoch 786 / 100000 - 3234 epochs total
Iteration 0, loss = 0.0040
Iteration 20, loss = 0.0050
Iteration 40, loss = 0.0058
Iteration 60, loss = 0.0078
Iteration 80, loss = 0.0466
--- Epoch 787 / 100000 - 3235 epochs total
Iteration 0, loss = 0.0223
Iteration 20, loss = 0.0303
Iteration 40, loss = 0.0025
Iteration 60, loss = 0.0385
Iteration 80, loss = 0.0141
--- Epoch 788 / 100000 - 3236 epochs total
Iteration 0, loss = 0.0194
Iteration 20, loss = 0.0023
Iteration 40, loss = 0.0016
Iteration 60, loss = 0.0128
Iteration 80, loss = 0.0038
--- Epoch 789 / 100000 - 3237 epochs total
Iteration 0, loss = 0.0037
Iteration 20, loss = 0.0133
Iteration 40, loss = 0.0050
Iteration 60, loss = 0.0026
Iteration 80, loss = 0.0113
--- Epoch 790 / 100000 - 3238 epochs total
Iteration 0, loss = 0.0096
Iteration 20, loss = 0.0179
Iteration 40, loss = 0.0032
Iteration 60, loss = 0.0019
Iteration 80, loss = 0.0183
--- Epoch 791 / 100000 - 3239 epochs total
Iteration 0, loss = 0.0201
Iteration 20, loss = 0.0097
Iteration 40, loss = 0.0224
Iteration 60, loss = 0.0093
Iteration 80, loss = 0.0087
--- Epoch 792 / 100000 - 3240 epochs total
Iteration 0, loss = 0.0164
Iteration 20, loss = 0.0165
Iteration 40, loss = 0.0088
Iteration 60, loss = 0.0113
Iteration 80, loss = 0.0359
--- Epoch 793 / 100000 - 3241 epochs total
Iteration 0, loss = 0.0156
Iteration 20, loss = 0.0048
Iteration 40, loss = 0.0087
Iteration 60, loss = 0.0139
Iteration 80, loss = 0.0099
--- Epoch 794 / 100000 - 3242 epochs total
Iteration 0, loss = 0.0294
Iteration 20, loss = 0.0014
Iteration 40, loss = 0.0076
Iteration 60, loss = 0.0103
Iteration 80, loss = 0.0168
--- Epoch 795 / 100000 - 3243 epochs total
Iteration 0, loss = 0.0023
Iteration 20, loss = 0.0076
Iteration 40, loss = 0.0118
Iteration 60, loss = 0.0233
Iteration 80, loss = 0.0098
--- Epoch 796 / 100000 - 3244 epochs total
Iteration 0, loss = 0.0032
Iteration 20, loss = 0.0159
Iteration 40, loss = 0.0195
Iteration 60, loss = 0.0190
Iteration 80, loss = 0.0063
--- Epoch 797 / 100000 - 3245 epochs total
Iteration 0, loss = 0.0056
Iteration 20, loss = 0.0179
Iteration 40, loss = 0.0042
Iteration 60, loss = 0.0049
Iteration 80, loss = 0.0222
--- Epoch 798 / 100000 - 3246 epochs total
Iteration 0, loss = 0.0108
Iteration 20, loss = 0.0032
Iteration 40, loss = 0.0013
Iteration 60, loss = 0.0009
Iteration 80, loss = 0.0104
--- Epoch 799 / 100000 - 3247 epochs total
Iteration 0, loss = 0.0099
Iteration 20, loss = 0.0069
Iteration 40, loss = 0.0027
Iteration 60, loss = 0.0086
Iteration 80, loss = 0.0157
--- Epoch 800 / 100000 - 3248 epochs total
Iteration 0, loss = 0.0122
Iteration 20, loss = 0.0056
Iteration 40, loss = 0.0015
Iteration 60, loss = 0.0204
Iteration 80, loss = 0.0091
--- Epoch 801 / 100000 - 3249 epochs total
Iteration 0, loss = 0.0330
Iteration 20, loss = 0.0108
Iteration 40, loss = 0.0032
Iteration 60, loss = 0.0076
Iteration 80, loss = 0.0139
--- Epoch 802 / 100000 - 3250 epochs total
Iteration 0, loss = 0.0104
Iteration 20, loss = 0.0240
Iteration 40, loss = 0.0053
Iteration 60, loss = 0.0023
Iteration 80, loss = 0.0148
--- Epoch 803 / 100000 - 3251 epochs total
Iteration 0, loss = 0.0114
Iteration 20, loss = 0.0184
Iteration 40, loss = 0.0047
Iteration 60, loss = 0.0074
Iteration 80, loss = 0.0171
--- Epoch 804 / 100000 - 3252 epochs total
Iteration 0, loss = 0.0264
Iteration 20, loss = 0.0424
Iteration 40, loss = 0.0045
Iteration 60, loss = 0.0042
Iteration 80, loss = 0.0163
--- Epoch 805 / 100000 - 3253 epochs total
Iteration 0, loss = 0.0058
Iteration 20, loss = 0.0020
Iteration 40, loss = 0.0023
Iteration 60, loss = 0.0134
Iteration 80, loss = 0.0167
--- Epoch 806 / 100000 - 3254 epochs total
Iteration 0, loss = 0.0058
Iteration 20, loss = 0.0085
Iteration 40, loss = 0.0059
Iteration 60, loss = 0.0091
Iteration 80, loss = 0.0208
--- Epoch 807 / 100000 - 3255 epochs total
Iteration 0, loss = 0.0059
Iteration 20, loss = 0.0217
Iteration 40, loss = 0.0172
Iteration 60, loss = 0.0047
Iteration 80, loss = 0.0170
--- Epoch 808 / 100000 - 3256 epochs total
Iteration 0, loss = 0.0055
Iteration 20, loss = 0.0171
Iteration 40, loss = 0.0225
Iteration 60, loss = 0.0044
Iteration 80, loss = 0.0045
--- Epoch 809 / 100000 - 3257 epochs total
Iteration 0, loss = 0.0025
Iteration 20, loss = 0.0066
Iteration 40, loss = 0.0069
Iteration 60, loss = 0.0071
Iteration 80, loss = 0.0100
--- Epoch 810 / 100000 - 3258 epochs total
Iteration 0, loss = 0.0035
Iteration 20, loss = 0.0056
Iteration 40, loss = 0.0053
Iteration 60, loss = 0.0045
Iteration 80, loss = 0.0062
--- Epoch 811 / 100000 - 3259 epochs total
Iteration 0, loss = 0.0033
Iteration 20, loss = 0.0044
Iteration 40, loss = 0.0117
Iteration 60, loss = 0.0020
Iteration 80, loss = 0.0120
--- Epoch 812 / 100000 - 3260 epochs total
Iteration 0, loss = 0.0025
Iteration 20, loss = 0.0181
Iteration 40, loss = 0.0505
Iteration 60, loss = 0.0076
Iteration 80, loss = 0.0384
--- Epoch 813 / 100000 - 3261 epochs total
Iteration 0, loss = 0.0203
Iteration 20, loss = 0.0016
Iteration 40, loss = 0.0030
Iteration 60, loss = 0.0037
Iteration 80, loss = 0.0247
--- Epoch 814 / 100000 - 3262 epochs total
Iteration 0, loss = 0.0040
Iteration 20, loss = 0.0018
Iteration 40, loss = 0.0031
Iteration 60, loss = 0.0056
Iteration 80, loss = 0.0200
--- Epoch 815 / 100000 - 3263 epochs total
Iteration 0, loss = 0.0016
Iteration 20, loss = 0.0045
Iteration 40, loss = 0.0047
Iteration 60, loss = 0.0106
Iteration 80, loss = 0.0047
--- Epoch 816 / 100000 - 3264 epochs total
Iteration 0, loss = 0.0049
Iteration 20, loss = 0.0048
Iteration 40, loss = 0.0195
Iteration 60, loss = 0.0109
Iteration 80, loss = 0.0100
--- Epoch 817 / 100000 - 3265 epochs total
Iteration 0, loss = 0.0014
Iteration 20, loss = 0.0019
Iteration 40, loss = 0.0017
Iteration 60, loss = 0.0040
Iteration 80, loss = 0.0044
--- Epoch 818 / 100000 - 3266 epochs total
Iteration 0, loss = 0.0094
Iteration 20, loss = 0.0034
Iteration 40, loss = 0.0038
Iteration 60, loss = 0.0066
Iteration 80, loss = 0.0106
--- Epoch 819 / 100000 - 3267 epochs total
Iteration 0, loss = 0.0023
Iteration 20, loss = 0.0012
Iteration 40, loss = 0.0019
Iteration 60, loss = 0.0096
Iteration 80, loss = 0.0017
--- Epoch 820 / 100000 - 3268 epochs total
Iteration 0, loss = 0.0113
Iteration 20, loss = 0.0054
Iteration 40, loss = 0.0043
Iteration 60, loss = 0.0176
Iteration 80, loss = 0.0157
--- Epoch 821 / 100000 - 3269 epochs total
Iteration 0, loss = 0.0063
Iteration 20, loss = 0.0079
Iteration 40, loss = 0.0436
Iteration 60, loss = 0.0141
Iteration 80, loss = 0.0084
--- Epoch 822 / 100000 - 3270 epochs total
Iteration 0, loss = 0.0040
Iteration 20, loss = 0.0076
Iteration 40, loss = 0.0086
Iteration 60, loss = 0.0022
Iteration 80, loss = 0.0030
--- Epoch 823 / 100000 - 3271 epochs total
Iteration 0, loss = 0.0046
Iteration 20, loss = 0.0013
Iteration 40, loss = 0.0228
Iteration 60, loss = 0.0044
Iteration 80, loss = 0.0101
--- Epoch 824 / 100000 - 3272 epochs total
Iteration 0, loss = 0.0039
Iteration 20, loss = 0.0087
Iteration 40, loss = 0.0582
Iteration 60, loss = 0.0038
Iteration 80, loss = 0.0585
--- Epoch 825 / 100000 - 3273 epochs total
Iteration 0, loss = 0.0066
Iteration 20, loss = 0.0093
Iteration 40, loss = 0.0259
Iteration 60, loss = 0.0119
Iteration 80, loss = 0.0052
--- Epoch 826 / 100000 - 3274 epochs total
Iteration 0, loss = 0.0075
Iteration 20, loss = 0.0079
Iteration 40, loss = 0.0075
Iteration 60, loss = 0.0148
Iteration 80, loss = 0.0035
--- Epoch 827 / 100000 - 3275 epochs total
Iteration 0, loss = 0.0063
Iteration 20, loss = 0.0219
Iteration 40, loss = 0.0182
Iteration 60, loss = 0.0286
Iteration 80, loss = 0.0753
--- Epoch 828 / 100000 - 3276 epochs total
Iteration 0, loss = 0.0118
Iteration 20, loss = 0.0125
Iteration 40, loss = 0.0089
Iteration 60, loss = 0.0071
Iteration 80, loss = 0.0030
--- Epoch 829 / 100000 - 3277 epochs total
Iteration 0, loss = 0.0225
Iteration 20, loss = 0.0361
Iteration 40, loss = 0.0049
Iteration 60, loss = 0.0057
Iteration 80, loss = 0.0039
--- Epoch 830 / 100000 - 3278 epochs total
Iteration 0, loss = 0.0089
Iteration 20, loss = 0.0175
Iteration 40, loss = 0.0112
Iteration 60, loss = 0.0086
Iteration 80, loss = 0.0301
--- Epoch 831 / 100000 - 3279 epochs total
Iteration 0, loss = 0.0426
Iteration 20, loss = 0.0029
Iteration 40, loss = 0.0064
Iteration 60, loss = 0.0025
Iteration 80, loss = 0.0173
--- Epoch 832 / 100000 - 3280 epochs total
Iteration 0, loss = 0.0035
Iteration 20, loss = 0.0187
Iteration 40, loss = 0.0023
Iteration 60, loss = 0.0011
Iteration 80, loss = 0.0048
--- Epoch 833 / 100000 - 3281 epochs total
Iteration 0, loss = 0.0079
Iteration 20, loss = 0.0032
Iteration 40, loss = 0.0043
Iteration 60, loss = 0.0313
Iteration 80, loss = 0.0061
--- Epoch 834 / 100000 - 3282 epochs total
Iteration 0, loss = 0.0056
Iteration 20, loss = 0.0099
Iteration 40, loss = 0.0052
Iteration 60, loss = 0.0056
Iteration 80, loss = 0.0078
--- Epoch 835 / 100000 - 3283 epochs total
Iteration 0, loss = 0.0039
Iteration 20, loss = 0.0216
Iteration 40, loss = 0.0121
Iteration 60, loss = 0.0043
Iteration 80, loss = 0.0041
--- Epoch 836 / 100000 - 3284 epochs total
Iteration 0, loss = 0.0023
Iteration 20, loss = 0.0077
Iteration 40, loss = 0.0041
Iteration 60, loss = 0.0317
Iteration 80, loss = 0.0047
--- Epoch 837 / 100000 - 3285 epochs total
Iteration 0, loss = 0.0022
Iteration 20, loss = 0.0083
Iteration 40, loss = 0.0148
Iteration 60, loss = 0.0068
Iteration 80, loss = 0.0135
--- Epoch 838 / 100000 - 3286 epochs total
Iteration 0, loss = 0.0043
Iteration 20, loss = 0.0177
Iteration 40, loss = 0.0035
Iteration 60, loss = 0.0060
Iteration 80, loss = 0.0106
--- Epoch 839 / 100000 - 3287 epochs total
Iteration 0, loss = 0.0016
Iteration 20, loss = 0.0087
Iteration 40, loss = 0.0056
Iteration 60, loss = 0.0093
Iteration 80, loss = 0.0053
--- Epoch 840 / 100000 - 3288 epochs total
Iteration 0, loss = 0.0208
Iteration 20, loss = 0.0147
Iteration 40, loss = 0.0077
Iteration 60, loss = 0.0156
Iteration 80, loss = 0.0049
--- Epoch 841 / 100000 - 3289 epochs total
Iteration 0, loss = 0.0499
Iteration 20, loss = 0.0044
Iteration 40, loss = 0.0028
Iteration 60, loss = 0.0028
Iteration 80, loss = 0.0081
--- Epoch 842 / 100000 - 3290 epochs total
Iteration 0, loss = 0.0085
Iteration 20, loss = 0.0040
Iteration 40, loss = 0.0256
Iteration 60, loss = 0.0106
Iteration 80, loss = 0.0056
--- Epoch 843 / 100000 - 3291 epochs total
Iteration 0, loss = 0.0088
Iteration 20, loss = 0.0047
Iteration 40, loss = 0.0036
Iteration 60, loss = 0.0028
Iteration 80, loss = 0.0433
--- Epoch 844 / 100000 - 3292 epochs total
Iteration 0, loss = 0.0042
Iteration 20, loss = 0.0527
Iteration 40, loss = 0.0076
Iteration 60, loss = 0.0084
Iteration 80, loss = 0.0156
--- Epoch 845 / 100000 - 3293 epochs total
Iteration 0, loss = 0.0344
Iteration 20, loss = 0.0113
Iteration 40, loss = 0.0106
Iteration 60, loss = 0.0147
Iteration 80, loss = 0.0023
--- Epoch 846 / 100000 - 3294 epochs total
Iteration 0, loss = 0.0093
Iteration 20, loss = 0.0229
Iteration 40, loss = 0.0041
Iteration 60, loss = 0.0315
Iteration 80, loss = 0.0350
--- Epoch 847 / 100000 - 3295 epochs total
Iteration 0, loss = 0.0049
Iteration 20, loss = 0.0044
Iteration 40, loss = 0.0035
Iteration 60, loss = 0.0046
Iteration 80, loss = 0.0061
--- Epoch 848 / 100000 - 3296 epochs total
Iteration 0, loss = 0.0020
Iteration 20, loss = 0.0196
Iteration 40, loss = 0.0070
Iteration 60, loss = 0.0060
Iteration 80, loss = 0.0050
--- Epoch 849 / 100000 - 3297 epochs total
Iteration 0, loss = 0.0046
Iteration 20, loss = 0.0012
Iteration 40, loss = 0.0012
Iteration 60, loss = 0.0054
Iteration 80, loss = 0.0014
--- Epoch 850 / 100000 - 3298 epochs total
Iteration 0, loss = 0.0022
Iteration 20, loss = 0.0076
Iteration 40, loss = 0.0121
Iteration 60, loss = 0.0054
Iteration 80, loss = 0.0092
--- Epoch 851 / 100000 - 3299 epochs total
Iteration 0, loss = 0.0015
Iteration 20, loss = 0.0074
Iteration 40, loss = 0.0047
Iteration 60, loss = 0.0095
Iteration 80, loss = 0.0041
--- Epoch 852 / 100000 - 3300 epochs total
Iteration 0, loss = 0.0108
Iteration 20, loss = 0.0152
Iteration 40, loss = 0.0073
Iteration 60, loss = 0.0079
Iteration 80, loss = 0.0062
--- Epoch 853 / 100000 - 3301 epochs total
Iteration 0, loss = 0.0035
Iteration 20, loss = 0.0093
Iteration 40, loss = 0.0112
Iteration 60, loss = 0.0455
Iteration 80, loss = 0.0024
--- Epoch 854 / 100000 - 3302 epochs total
Iteration 0, loss = 0.0112
Iteration 20, loss = 0.0016
Iteration 40, loss = 0.0018
Iteration 60, loss = 0.0255
Iteration 80, loss = 0.0051
--- Epoch 855 / 100000 - 3303 epochs total
Iteration 0, loss = 0.0030
Iteration 20, loss = 0.0038
Iteration 40, loss = 0.0025
Iteration 60, loss = 0.0029
Iteration 80, loss = 0.0057
--- Epoch 856 / 100000 - 3304 epochs total
Iteration 0, loss = 0.0722
Iteration 20, loss = 0.0022
Iteration 40, loss = 0.0022
Iteration 60, loss = 0.0095
Iteration 80, loss = 0.0050
--- Epoch 857 / 100000 - 3305 epochs total
Iteration 0, loss = 0.0128
Iteration 20, loss = 0.0024
Iteration 40, loss = 0.0023
Iteration 60, loss = 0.0023
Iteration 80, loss = 0.0309
--- Epoch 858 / 100000 - 3306 epochs total
Iteration 0, loss = 0.0022
Iteration 20, loss = 0.0079
Iteration 40, loss = 0.0045
Iteration 60, loss = 0.0105
Iteration 80, loss = 0.0082
--- Epoch 859 / 100000 - 3307 epochs total
Iteration 0, loss = 0.0128
Iteration 20, loss = 0.0015
Iteration 40, loss = 0.0058
Iteration 60, loss = 0.0090
Iteration 80, loss = 0.0020
--- Epoch 860 / 100000 - 3308 epochs total
Iteration 0, loss = 0.0054
Iteration 20, loss = 0.0033
Iteration 40, loss = 0.0266
Iteration 60, loss = 0.0390
Iteration 80, loss = 0.0225
--- Epoch 861 / 100000 - 3309 epochs total
Iteration 0, loss = 0.0098
Iteration 20, loss = 0.0022
Iteration 40, loss = 0.0100
Iteration 60, loss = 0.0038
Iteration 80, loss = 0.0112
--- Epoch 862 / 100000 - 3310 epochs total
Iteration 0, loss = 0.0061
Iteration 20, loss = 0.0076
Iteration 40, loss = 0.0125
Iteration 60, loss = 0.0107
Iteration 80, loss = 0.0064
--- Epoch 863 / 100000 - 3311 epochs total
Iteration 0, loss = 0.0044
Iteration 20, loss = 0.0286
Iteration 40, loss = 0.0132
Iteration 60, loss = 0.0241
Iteration 80, loss = 0.0191
--- Epoch 864 / 100000 - 3312 epochs total
Iteration 0, loss = 0.0068
Iteration 20, loss = 0.0096
Iteration 40, loss = 0.0073
Iteration 60, loss = 0.0069
Iteration 80, loss = 0.0156
--- Epoch 865 / 100000 - 3313 epochs total
Iteration 0, loss = 0.0125
Iteration 20, loss = 0.0099
Iteration 40, loss = 0.0017
Iteration 60, loss = 0.0017
Iteration 80, loss = 0.0012
--- Epoch 866 / 100000 - 3314 epochs total
Iteration 0, loss = 0.0116
Iteration 20, loss = 0.0121
Iteration 40, loss = 0.0063
Iteration 60, loss = 0.0039
Iteration 80, loss = 0.0045
--- Epoch 867 / 100000 - 3315 epochs total
Iteration 0, loss = 0.0176
Iteration 20, loss = 0.0037
Iteration 40, loss = 0.0375
Iteration 60, loss = 0.0189
Iteration 80, loss = 0.0081
--- Epoch 868 / 100000 - 3316 epochs total
Iteration 0, loss = 0.0057
Iteration 20, loss = 0.0060
Iteration 40, loss = 0.0108
Iteration 60, loss = 0.0066
Iteration 80, loss = 0.0144
--- Epoch 869 / 100000 - 3317 epochs total
Iteration 0, loss = 0.0043
Iteration 20, loss = 0.0056
Iteration 40, loss = 0.0038
Iteration 60, loss = 0.0154
Iteration 80, loss = 0.0031
--- Epoch 870 / 100000 - 3318 epochs total
Iteration 0, loss = 0.0079
Iteration 20, loss = 0.0018
Iteration 40, loss = 0.0082
Iteration 60, loss = 0.0032
Iteration 80, loss = 0.0081
--- Epoch 871 / 100000 - 3319 epochs total
Iteration 0, loss = 0.0236
Iteration 20, loss = 0.0035
Iteration 40, loss = 0.0016
Iteration 60, loss = 0.0295
Iteration 80, loss = 0.0060
--- Epoch 872 / 100000 - 3320 epochs total
Iteration 0, loss = 0.0210
Iteration 20, loss = 0.0025
Iteration 40, loss = 0.0046
Iteration 60, loss = 0.0092
Iteration 80, loss = 0.0144
--- Epoch 873 / 100000 - 3321 epochs total
Iteration 0, loss = 0.0043
Iteration 20, loss = 0.0019
Iteration 40, loss = 0.0019
Iteration 60, loss = 0.0035
Iteration 80, loss = 0.0022
--- Epoch 874 / 100000 - 3322 epochs total
Iteration 0, loss = 0.0153
Iteration 20, loss = 0.0067
Iteration 40, loss = 0.0113
Iteration 60, loss = 0.0078
Iteration 80, loss = 0.0027
--- Epoch 875 / 100000 - 3323 epochs total
Iteration 0, loss = 0.0107
Iteration 20, loss = 0.0040
Iteration 40, loss = 0.0388
Iteration 60, loss = 0.0051
Iteration 80, loss = 0.0019
--- Epoch 876 / 100000 - 3324 epochs total
Iteration 0, loss = 0.0031
Iteration 20, loss = 0.0125
Iteration 40, loss = 0.0080
Iteration 60, loss = 0.0022
Iteration 80, loss = 0.0431
--- Epoch 877 / 100000 - 3325 epochs total
Iteration 0, loss = 0.0020
Iteration 20, loss = 0.0055
Iteration 40, loss = 0.0193
Iteration 60, loss = 0.0109
Iteration 80, loss = 0.0011
--- Epoch 878 / 100000 - 3326 epochs total
Iteration 0, loss = 0.0068
Iteration 20, loss = 0.0071
Iteration 40, loss = 0.0012
Iteration 60, loss = 0.0507
Iteration 80, loss = 0.0072
--- Epoch 879 / 100000 - 3327 epochs total
Iteration 0, loss = 0.0050
Iteration 20, loss = 0.0081
Iteration 40, loss = 0.0113
Iteration 60, loss = 0.0027
Iteration 80, loss = 0.0168
--- Epoch 880 / 100000 - 3328 epochs total
Iteration 0, loss = 0.0084
Iteration 20, loss = 0.0118
Iteration 40, loss = 0.0039
Iteration 60, loss = 0.0114
Iteration 80, loss = 0.0024
--- Epoch 881 / 100000 - 3329 epochs total
Iteration 0, loss = 0.0038
Iteration 20, loss = 0.0056
Iteration 40, loss = 0.0048
Iteration 60, loss = 0.0078
Iteration 80, loss = 0.0080
--- Epoch 882 / 100000 - 3330 epochs total
Iteration 0, loss = 0.0028
Iteration 20, loss = 0.0037
Iteration 40, loss = 0.0060
Iteration 60, loss = 0.0231
Iteration 80, loss = 0.0049
--- Epoch 883 / 100000 - 3331 epochs total
Iteration 0, loss = 0.0265
Iteration 20, loss = 0.0048
Iteration 40, loss = 0.0012
Iteration 60, loss = 0.0020
Iteration 80, loss = 0.0033
--- Epoch 884 / 100000 - 3332 epochs total
Iteration 0, loss = 0.0061
Iteration 20, loss = 0.0057
Iteration 40, loss = 0.0060
Iteration 60, loss = 0.0151
Iteration 80, loss = 0.0031
--- Epoch 885 / 100000 - 3333 epochs total
Iteration 0, loss = 0.0089
Iteration 20, loss = 0.0026
Iteration 40, loss = 0.0023
Iteration 60, loss = 0.0149
Iteration 80, loss = 0.0098
--- Epoch 886 / 100000 - 3334 epochs total
Iteration 0, loss = 0.0027
Iteration 20, loss = 0.0017
Iteration 40, loss = 0.0026
Iteration 60, loss = 0.0058
Iteration 80, loss = 0.0096
--- Epoch 887 / 100000 - 3335 epochs total
Iteration 0, loss = 0.0102
Iteration 20, loss = 0.0102
Iteration 40, loss = 0.0052
Iteration 60, loss = 0.0049
Iteration 80, loss = 0.0101
--- Epoch 888 / 100000 - 3336 epochs total
Iteration 0, loss = 0.0119
Iteration 20, loss = 0.0139
Iteration 40, loss = 0.0222
Iteration 60, loss = 0.0040
Iteration 80, loss = 0.0123
--- Epoch 889 / 100000 - 3337 epochs total
Iteration 0, loss = 0.0164
Iteration 20, loss = 0.0308
Iteration 40, loss = 0.0062
Iteration 60, loss = 0.0044
Iteration 80, loss = 0.0042
--- Epoch 890 / 100000 - 3338 epochs total
Iteration 0, loss = 0.0047
Iteration 20, loss = 0.0206
Iteration 40, loss = 0.0108
Iteration 60, loss = 0.0104
Iteration 80, loss = 0.0101
--- Epoch 891 / 100000 - 3339 epochs total
Iteration 0, loss = 0.0025
Iteration 20, loss = 0.0124
Iteration 40, loss = 0.0087
Iteration 60, loss = 0.0134
Iteration 80, loss = 0.0115
--- Epoch 892 / 100000 - 3340 epochs total
Iteration 0, loss = 0.0019
Iteration 20, loss = 0.0115
Iteration 40, loss = 0.0039
Iteration 60, loss = 0.0068
Iteration 80, loss = 0.0137
--- Epoch 893 / 100000 - 3341 epochs total
Iteration 0, loss = 0.0043
Iteration 20, loss = 0.0030
Iteration 40, loss = 0.0021
Iteration 60, loss = 0.0014
Iteration 80, loss = 0.0025
--- Epoch 894 / 100000 - 3342 epochs total
Iteration 0, loss = 0.0056
Iteration 20, loss = 0.0076
Iteration 40, loss = 0.0142
Iteration 60, loss = 0.0105
Iteration 80, loss = 0.0010
--- Epoch 895 / 100000 - 3343 epochs total
Iteration 0, loss = 0.0037
Iteration 20, loss = 0.0046
Iteration 40, loss = 0.0064
Iteration 60, loss = 0.0027
Iteration 80, loss = 0.0580
--- Epoch 896 / 100000 - 3344 epochs total
Iteration 0, loss = 0.0135
Iteration 20, loss = 0.0029
Iteration 40, loss = 0.0492
Iteration 60, loss = 0.0134
Iteration 80, loss = 0.0056
--- Epoch 897 / 100000 - 3345 epochs total
Iteration 0, loss = 0.0102
Iteration 20, loss = 0.0028
Iteration 40, loss = 0.0016
Iteration 60, loss = 0.0234
Iteration 80, loss = 0.0238
--- Epoch 898 / 100000 - 3346 epochs total
Iteration 0, loss = 0.0053
Iteration 20, loss = 0.0076
Iteration 40, loss = 0.0026
Iteration 60, loss = 0.0049
Iteration 80, loss = 0.0036
--- Epoch 899 / 100000 - 3347 epochs total
Iteration 0, loss = 0.0044
Iteration 20, loss = 0.0010
Iteration 40, loss = 0.0064
Iteration 60, loss = 0.0060
Iteration 80, loss = 0.0066
--- Epoch 900 / 100000 - 3348 epochs total
Iteration 0, loss = 0.0080
Iteration 20, loss = 0.0012
Iteration 40, loss = 0.0044
Iteration 60, loss = 0.0029
Iteration 80, loss = 0.0024
--- Epoch 901 / 100000 - 3349 epochs total
Iteration 0, loss = 0.0053
Iteration 20, loss = 0.0188
Iteration 40, loss = 0.0030
Iteration 60, loss = 0.0054
Iteration 80, loss = 0.0066
--- Epoch 902 / 100000 - 3350 epochs total
Iteration 0, loss = 0.0045
Iteration 20, loss = 0.0060
Iteration 40, loss = 0.0020
Iteration 60, loss = 0.0066
Iteration 80, loss = 0.0042
--- Epoch 903 / 100000 - 3351 epochs total
Iteration 0, loss = 0.0141
Iteration 20, loss = 0.0041
Iteration 40, loss = 0.0061
Iteration 60, loss = 0.0033
Iteration 80, loss = 0.0025
--- Epoch 904 / 100000 - 3352 epochs total
Iteration 0, loss = 0.0153
Iteration 20, loss = 0.0147
Iteration 40, loss = 0.0069
Iteration 60, loss = 0.0048
Iteration 80, loss = 0.0108
--- Epoch 905 / 100000 - 3353 epochs total
Iteration 0, loss = 0.0023
Iteration 20, loss = 0.0268
Iteration 40, loss = 0.0025
Iteration 60, loss = 0.0081
Iteration 80, loss = 0.0133
--- Epoch 906 / 100000 - 3354 epochs total
Iteration 0, loss = 0.0030
Iteration 20, loss = 0.0066
Iteration 40, loss = 0.0106
Iteration 60, loss = 0.0133
Iteration 80, loss = 0.0032
--- Epoch 907 / 100000 - 3355 epochs total
Iteration 0, loss = 0.0045
Iteration 20, loss = 0.0042
Iteration 40, loss = 0.0060
Iteration 60, loss = 0.0068
Iteration 80, loss = 0.0024
--- Epoch 908 / 100000 - 3356 epochs total
Iteration 0, loss = 0.0050
Iteration 20, loss = 0.0061
Iteration 40, loss = 0.0722
Iteration 60, loss = 0.0011
Iteration 80, loss = 0.0017
--- Epoch 909 / 100000 - 3357 epochs total
Iteration 0, loss = 0.0586
Iteration 20, loss = 0.0081
Iteration 40, loss = 0.0110
Iteration 60, loss = 0.0045
Iteration 80, loss = 0.0189
--- Epoch 910 / 100000 - 3358 epochs total
Iteration 0, loss = 0.0128
Iteration 20, loss = 0.0128
Iteration 40, loss = 0.0024
Iteration 60, loss = 0.0053
Iteration 80, loss = 0.0051
--- Epoch 911 / 100000 - 3359 epochs total
Iteration 0, loss = 0.0045
Iteration 20, loss = 0.0075
Iteration 40, loss = 0.0292
Iteration 60, loss = 0.0022
Iteration 80, loss = 0.0042
--- Epoch 912 / 100000 - 3360 epochs total
Iteration 0, loss = 0.0015
Iteration 20, loss = 0.0041
Iteration 40, loss = 0.0369
Iteration 60, loss = 0.0067
Iteration 80, loss = 0.0075
--- Epoch 913 / 100000 - 3361 epochs total
Iteration 0, loss = 0.0042
Iteration 20, loss = 0.0046
Iteration 40, loss = 0.0159
Iteration 60, loss = 0.0118
Iteration 80, loss = 0.0023
--- Epoch 914 / 100000 - 3362 epochs total
Iteration 0, loss = 0.0053
Iteration 20, loss = 0.0045
Iteration 40, loss = 0.0101
Iteration 60, loss = 0.0168
Iteration 80, loss = 0.0040
--- Epoch 915 / 100000 - 3363 epochs total
Iteration 0, loss = 0.0036
Iteration 20, loss = 0.0096
Iteration 40, loss = 0.0058
Iteration 60, loss = 0.0036
Iteration 80, loss = 0.0120
--- Epoch 916 / 100000 - 3364 epochs total
Iteration 0, loss = 0.0204
Iteration 20, loss = 0.0183
Iteration 40, loss = 0.0087
Iteration 60, loss = 0.0100
Iteration 80, loss = 0.0230
--- Epoch 917 / 100000 - 3365 epochs total
Iteration 0, loss = 0.0054
Iteration 20, loss = 0.0016
Iteration 40, loss = 0.0351
Iteration 60, loss = 0.0026
Iteration 80, loss = 0.0162
--- Epoch 918 / 100000 - 3366 epochs total
Iteration 0, loss = 0.0225
Iteration 20, loss = 0.0113
Iteration 40, loss = 0.0091
Iteration 60, loss = 0.0189
Iteration 80, loss = 0.0012
--- Epoch 919 / 100000 - 3367 epochs total
Iteration 0, loss = 0.0070
Iteration 20, loss = 0.0069
Iteration 40, loss = 0.0260
Iteration 60, loss = 0.0027
Iteration 80, loss = 0.0083
--- Epoch 920 / 100000 - 3368 epochs total
Iteration 0, loss = 0.0078
Iteration 20, loss = 0.0055
Iteration 40, loss = 0.0115
Iteration 60, loss = 0.0047
Iteration 80, loss = 0.0052
--- Epoch 921 / 100000 - 3369 epochs total
Iteration 0, loss = 0.0032
Iteration 20, loss = 0.0226
Iteration 40, loss = 0.0097
Iteration 60, loss = 0.0066
Iteration 80, loss = 0.0043
--- Epoch 922 / 100000 - 3370 epochs total
Iteration 0, loss = 0.0129
Iteration 20, loss = 0.0068
Iteration 40, loss = 0.0092
Iteration 60, loss = 0.0290
Iteration 80, loss = 0.0141
--- Epoch 923 / 100000 - 3371 epochs total
Iteration 0, loss = 0.0058
Iteration 20, loss = 0.0149
Iteration 40, loss = 0.0037
Iteration 60, loss = 0.0034
Iteration 80, loss = 0.0043
--- Epoch 924 / 100000 - 3372 epochs total
Iteration 0, loss = 0.0038
Iteration 20, loss = 0.0195
Iteration 40, loss = 0.0241
Iteration 60, loss = 0.0026
Iteration 80, loss = 0.0073
--- Epoch 925 / 100000 - 3373 epochs total
Iteration 0, loss = 0.0192
Iteration 20, loss = 0.0024
Iteration 40, loss = 0.0670
Iteration 60, loss = 0.0039
Iteration 80, loss = 0.0041
--- Epoch 926 / 100000 - 3374 epochs total
Iteration 0, loss = 0.0275
Iteration 20, loss = 0.0114
Iteration 40, loss = 0.0824
Iteration 60, loss = 0.0031
Iteration 80, loss = 0.0384
--- Epoch 927 / 100000 - 3375 epochs total
Iteration 0, loss = 0.0138
Iteration 20, loss = 0.0186
Iteration 40, loss = 0.0034
Iteration 60, loss = 0.0014
Iteration 80, loss = 0.0072
--- Epoch 928 / 100000 - 3376 epochs total
Iteration 0, loss = 0.0081
Iteration 20, loss = 0.0026
Iteration 40, loss = 0.0103
Iteration 60, loss = 0.0012
Iteration 80, loss = 0.0116
--- Epoch 929 / 100000 - 3377 epochs total
Iteration 0, loss = 0.0093
Iteration 20, loss = 0.0027
Iteration 40, loss = 0.0042
Iteration 60, loss = 0.0050
Iteration 80, loss = 0.0062
--- Epoch 930 / 100000 - 3378 epochs total
Iteration 0, loss = 0.0126
Iteration 20, loss = 0.0322
Iteration 40, loss = 0.0035
Iteration 60, loss = 0.0071
Iteration 80, loss = 0.0015
--- Epoch 931 / 100000 - 3379 epochs total
Iteration 0, loss = 0.0026
Iteration 20, loss = 0.0070
Iteration 40, loss = 0.0018
Iteration 60, loss = 0.0078
Iteration 80, loss = 0.0069
--- Epoch 932 / 100000 - 3380 epochs total
Iteration 0, loss = 0.0034
Iteration 20, loss = 0.0206
Iteration 40, loss = 0.0048
Iteration 60, loss = 0.0016
Iteration 80, loss = 0.0054
--- Epoch 933 / 100000 - 3381 epochs total
Iteration 0, loss = 0.0143
Iteration 20, loss = 0.0348
Iteration 40, loss = 0.0083
Iteration 60, loss = 0.0066
Iteration 80, loss = 0.0087
--- Epoch 934 / 100000 - 3382 epochs total
Iteration 0, loss = 0.0258
Iteration 20, loss = 0.0027
Iteration 40, loss = 0.0086
Iteration 60, loss = 0.0182
Iteration 80, loss = 0.0035
--- Epoch 935 / 100000 - 3383 epochs total
Iteration 0, loss = 0.0066
Iteration 20, loss = 0.0111
Iteration 40, loss = 0.0033
Iteration 60, loss = 0.0045
Iteration 80, loss = 0.0045
--- Epoch 936 / 100000 - 3384 epochs total
Iteration 0, loss = 0.0138
Iteration 20, loss = 0.0062
Iteration 40, loss = 0.0016
Iteration 60, loss = 0.0067
Iteration 80, loss = 0.0618
--- Epoch 937 / 100000 - 3385 epochs total
Iteration 0, loss = 0.0037
Iteration 20, loss = 0.0054
Iteration 40, loss = 0.0067
Iteration 60, loss = 0.0152
Iteration 80, loss = 0.0069
--- Epoch 938 / 100000 - 3386 epochs total
Iteration 0, loss = 0.0014
Iteration 20, loss = 0.0015
Iteration 40, loss = 0.0167
Iteration 60, loss = 0.0118
Iteration 80, loss = 0.0097
--- Epoch 939 / 100000 - 3387 epochs total
Iteration 0, loss = 0.0106
Iteration 20, loss = 0.0034
Iteration 40, loss = 0.0211
Iteration 60, loss = 0.0101
Iteration 80, loss = 0.0073
--- Epoch 940 / 100000 - 3388 epochs total
Iteration 0, loss = 0.0106
Iteration 20, loss = 0.0037
Iteration 40, loss = 0.0044
Iteration 60, loss = 0.0059
Iteration 80, loss = 0.0136
--- Epoch 941 / 100000 - 3389 epochs total
Iteration 0, loss = 0.0402
Iteration 20, loss = 0.0063
Iteration 40, loss = 0.0130
Iteration 60, loss = 0.0012
Iteration 80, loss = 0.0038
--- Epoch 942 / 100000 - 3390 epochs total
Iteration 0, loss = 0.0027
Iteration 20, loss = 0.0118
Iteration 40, loss = 0.0079
Iteration 60, loss = 0.0074
Iteration 80, loss = 0.0030
--- Epoch 943 / 100000 - 3391 epochs total
Iteration 0, loss = 0.0148
Iteration 20, loss = 0.0057
Iteration 40, loss = 0.0041
Iteration 60, loss = 0.0039
Iteration 80, loss = 0.0040
--- Epoch 944 / 100000 - 3392 epochs total
Iteration 0, loss = 0.0057
Iteration 20, loss = 0.0180
Iteration 40, loss = 0.0034
Iteration 60, loss = 0.0075
Iteration 80, loss = 0.0046
--- Epoch 945 / 100000 - 3393 epochs total
Iteration 0, loss = 0.0360
Iteration 20, loss = 0.0153
Iteration 40, loss = 0.0189
Iteration 60, loss = 0.0011
Iteration 80, loss = 0.0123
--- Epoch 946 / 100000 - 3394 epochs total
Iteration 0, loss = 0.0821
Iteration 20, loss = 0.0014
Iteration 40, loss = 0.0105
Iteration 60, loss = 0.0087
Iteration 80, loss = 0.0065
--- Epoch 947 / 100000 - 3395 epochs total
Iteration 0, loss = 0.0064
Iteration 20, loss = 0.0194
Iteration 40, loss = 0.0124
Iteration 60, loss = 0.0058
Iteration 80, loss = 0.0098
--- Epoch 948 / 100000 - 3396 epochs total
Iteration 0, loss = 0.0041
Iteration 20, loss = 0.0030
Iteration 40, loss = 0.0160
Iteration 60, loss = 0.0271
Iteration 80, loss = 0.0117
--- Epoch 949 / 100000 - 3397 epochs total
Iteration 0, loss = 0.0057
Iteration 20, loss = 0.0029
Iteration 40, loss = 0.0096
Iteration 60, loss = 0.0148
Iteration 80, loss = 0.0070
--- Epoch 950 / 100000 - 3398 epochs total
Iteration 0, loss = 0.0034
Iteration 20, loss = 0.0037
Iteration 40, loss = 0.0111
Iteration 60, loss = 0.0024
Iteration 80, loss = 0.0014
--- Epoch 951 / 100000 - 3399 epochs total
Iteration 0, loss = 0.0139
Iteration 20, loss = 0.0022
Iteration 40, loss = 0.0014
Iteration 60, loss = 0.0124
Iteration 80, loss = 0.0121
--- Epoch 952 / 100000 - 3400 epochs total
Iteration 0, loss = 0.0016
Iteration 20, loss = 0.0041
Iteration 40, loss = 0.0228
Iteration 60, loss = 0.0214
Iteration 80, loss = 0.0119
--- Epoch 953 / 100000 - 3401 epochs total
Iteration 0, loss = 0.0043
Iteration 20, loss = 0.0041
Iteration 40, loss = 0.0050
Iteration 60, loss = 0.0049
Iteration 80, loss = 0.0022
--- Epoch 954 / 100000 - 3402 epochs total
Iteration 0, loss = 0.0016
Iteration 20, loss = 0.0031
Iteration 40, loss = 0.0020
Iteration 60, loss = 0.0063
Iteration 80, loss = 0.0151
--- Epoch 955 / 100000 - 3403 epochs total
Iteration 0, loss = 0.0188
Iteration 20, loss = 0.0105
Iteration 40, loss = 0.0068
Iteration 60, loss = 0.0060
Iteration 80, loss = 0.0147
--- Epoch 956 / 100000 - 3404 epochs total
Iteration 0, loss = 0.0025
Iteration 20, loss = 0.0017
Iteration 40, loss = 0.0101
Iteration 60, loss = 0.0140
Iteration 80, loss = 0.0068
--- Epoch 957 / 100000 - 3405 epochs total
Iteration 0, loss = 0.0037
Iteration 20, loss = 0.0061
Iteration 40, loss = 0.0038
Iteration 60, loss = 0.0036
Iteration 80, loss = 0.0272
--- Epoch 958 / 100000 - 3406 epochs total
Iteration 0, loss = 0.0067
Iteration 20, loss = 0.0313
Iteration 40, loss = 0.0371
Iteration 60, loss = 0.0102
Iteration 80, loss = 0.0048
--- Epoch 959 / 100000 - 3407 epochs total
Iteration 0, loss = 0.0042
Iteration 20, loss = 0.0015
Iteration 40, loss = 0.0063
Iteration 60, loss = 0.0198
Iteration 80, loss = 0.0053
--- Epoch 960 / 100000 - 3408 epochs total
Iteration 0, loss = 0.0026
Iteration 20, loss = 0.0069
Iteration 40, loss = 0.0039
Iteration 60, loss = 0.0020
Iteration 80, loss = 0.0040
--- Epoch 961 / 100000 - 3409 epochs total
Iteration 0, loss = 0.0055
Iteration 20, loss = 0.0148
Iteration 40, loss = 0.0098
Iteration 60, loss = 0.0030
Iteration 80, loss = 0.0037
--- Epoch 962 / 100000 - 3410 epochs total
Iteration 0, loss = 0.0119
Iteration 20, loss = 0.0141
Iteration 40, loss = 0.0034
Iteration 60, loss = 0.0033
Iteration 80, loss = 0.0059
--- Epoch 963 / 100000 - 3411 epochs total
Iteration 0, loss = 0.0027
Iteration 20, loss = 0.0047
Iteration 40, loss = 0.0069
Iteration 60, loss = 0.0061
Iteration 80, loss = 0.0228
--- Epoch 964 / 100000 - 3412 epochs total
Iteration 0, loss = 0.0050
Iteration 20, loss = 0.0021
Iteration 40, loss = 0.0115
Iteration 60, loss = 0.0270
Iteration 80, loss = 0.0102
--- Epoch 965 / 100000 - 3413 epochs total
Iteration 0, loss = 0.0060
Iteration 20, loss = 0.0031
Iteration 40, loss = 0.0046
Iteration 60, loss = 0.0054
Iteration 80, loss = 0.0119
--- Epoch 966 / 100000 - 3414 epochs total
Iteration 0, loss = 0.0043
Iteration 20, loss = 0.0107
Iteration 40, loss = 0.0055
Iteration 60, loss = 0.0052
Iteration 80, loss = 0.0088
--- Epoch 967 / 100000 - 3415 epochs total
Iteration 0, loss = 0.0324
Iteration 20, loss = 0.0040
Iteration 40, loss = 0.0565
Iteration 60, loss = 0.0069
Iteration 80, loss = 0.0097
--- Epoch 968 / 100000 - 3416 epochs total
Iteration 0, loss = 0.0127
Iteration 20, loss = 0.0024
Iteration 40, loss = 0.0125
Iteration 60, loss = 0.0172
Iteration 80, loss = 0.0362
--- Epoch 969 / 100000 - 3417 epochs total
Iteration 0, loss = 0.0119
Iteration 20, loss = 0.0059
Iteration 40, loss = 0.0037
Iteration 60, loss = 0.0067
Iteration 80, loss = 0.0035
--- Epoch 970 / 100000 - 3418 epochs total
Iteration 0, loss = 0.0065
Iteration 20, loss = 0.0178
Iteration 40, loss = 0.0035
Iteration 60, loss = 0.0031
Iteration 80, loss = 0.0076
--- Epoch 971 / 100000 - 3419 epochs total
Iteration 0, loss = 0.0031
Iteration 20, loss = 0.0042
Iteration 40, loss = 0.0079
Iteration 60, loss = 0.0027
Iteration 80, loss = 0.0056
--- Epoch 972 / 100000 - 3420 epochs total
Iteration 0, loss = 0.0127
Iteration 20, loss = 0.0116
Iteration 40, loss = 0.0052
Iteration 60, loss = 0.0147
Iteration 80, loss = 0.0207
--- Epoch 973 / 100000 - 3421 epochs total
Iteration 0, loss = 0.0032
Iteration 20, loss = 0.0046
Iteration 40, loss = 0.0049
Iteration 60, loss = 0.0080
Iteration 80, loss = 0.0021
--- Epoch 974 / 100000 - 3422 epochs total
Iteration 0, loss = 0.0044
Iteration 20, loss = 0.0058
Iteration 40, loss = 0.0029
Iteration 60, loss = 0.0023
Iteration 80, loss = 0.0083
--- Epoch 975 / 100000 - 3423 epochs total
Iteration 0, loss = 0.0032
Iteration 20, loss = 0.0053
Iteration 40, loss = 0.0009
Iteration 60, loss = 0.0264
Iteration 80, loss = 0.0042
--- Epoch 976 / 100000 - 3424 epochs total
Iteration 0, loss = 0.0024
Iteration 20, loss = 0.0031
Iteration 40, loss = 0.0078
Iteration 60, loss = 0.0133
Iteration 80, loss = 0.0088
--- Epoch 977 / 100000 - 3425 epochs total
Iteration 0, loss = 0.0073
Iteration 20, loss = 0.0299
Iteration 40, loss = 0.0142
Iteration 60, loss = 0.0060
Iteration 80, loss = 0.0108
--- Epoch 978 / 100000 - 3426 epochs total
Iteration 0, loss = 0.0028
Iteration 20, loss = 0.0030
Iteration 40, loss = 0.0021
Iteration 60, loss = 0.0207
Iteration 80, loss = 0.0235
--- Epoch 979 / 100000 - 3427 epochs total
Iteration 0, loss = 0.0170
Iteration 20, loss = 0.0057
Iteration 40, loss = 0.0416
Iteration 60, loss = 0.0086
Iteration 80, loss = 0.0027
--- Epoch 980 / 100000 - 3428 epochs total
Iteration 0, loss = 0.0021
Iteration 20, loss = 0.0019
Iteration 40, loss = 0.0238
Iteration 60, loss = 0.0038
Iteration 80, loss = 0.0067
--- Epoch 981 / 100000 - 3429 epochs total
Iteration 0, loss = 0.0123
Iteration 20, loss = 0.0247
Iteration 40, loss = 0.0107
Iteration 60, loss = 0.0102
Iteration 80, loss = 0.0089
--- Epoch 982 / 100000 - 3430 epochs total
Iteration 0, loss = 0.0017
Iteration 20, loss = 0.0083
Iteration 40, loss = 0.0028
Iteration 60, loss = 0.0281
Iteration 80, loss = 0.0031
--- Epoch 983 / 100000 - 3431 epochs total
Iteration 0, loss = 0.0010
Iteration 20, loss = 0.0101
Iteration 40, loss = 0.0086
Iteration 60, loss = 0.0050
Iteration 80, loss = 0.0149
--- Epoch 984 / 100000 - 3432 epochs total
Iteration 0, loss = 0.0044
Iteration 20, loss = 0.0106
Iteration 40, loss = 0.0030
Iteration 60, loss = 0.0031
Iteration 80, loss = 0.0116
--- Epoch 985 / 100000 - 3433 epochs total
Iteration 0, loss = 0.0187
Iteration 20, loss = 0.0031
Iteration 40, loss = 0.0108
Iteration 60, loss = 0.0345
Iteration 80, loss = 0.0039
--- Epoch 986 / 100000 - 3434 epochs total
Iteration 0, loss = 0.0026
Iteration 20, loss = 0.0164
Iteration 40, loss = 0.0092
Iteration 60, loss = 0.0180
Iteration 80, loss = 0.0123
--- Epoch 987 / 100000 - 3435 epochs total
Iteration 0, loss = 0.0187
Iteration 20, loss = 0.0055
Iteration 40, loss = 0.0032
Iteration 60, loss = 0.0097
Iteration 80, loss = 0.0321
--- Epoch 988 / 100000 - 3436 epochs total
Iteration 0, loss = 0.0096
Iteration 20, loss = 0.0018
Iteration 40, loss = 0.0117
Iteration 60, loss = 0.0083
Iteration 80, loss = 0.0054
--- Epoch 989 / 100000 - 3437 epochs total
Iteration 0, loss = 0.0035
Iteration 20, loss = 0.0080
Iteration 40, loss = 0.0073
Iteration 60, loss = 0.0076
Iteration 80, loss = 0.0973
--- Epoch 990 / 100000 - 3438 epochs total
Iteration 0, loss = 0.0213
Iteration 20, loss = 0.0088
Iteration 40, loss = 0.0022
Iteration 60, loss = 0.0240
Iteration 80, loss = 0.0207
--- Epoch 991 / 100000 - 3439 epochs total
Iteration 0, loss = 0.0068
Iteration 20, loss = 0.0123
Iteration 40, loss = 0.0034
Iteration 60, loss = 0.0048
Iteration 80, loss = 0.0045
--- Epoch 992 / 100000 - 3440 epochs total
Iteration 0, loss = 0.0050
Iteration 20, loss = 0.0068
Iteration 40, loss = 0.0197
Iteration 60, loss = 0.0088
Iteration 80, loss = 0.0062
--- Epoch 993 / 100000 - 3441 epochs total
Iteration 0, loss = 0.0249
Iteration 20, loss = 0.0092
Iteration 40, loss = 0.0129
Iteration 60, loss = 0.0065
Iteration 80, loss = 0.0192
--- Epoch 994 / 100000 - 3442 epochs total
Iteration 0, loss = 0.0030
Iteration 20, loss = 0.0100
Iteration 40, loss = 0.0091
Iteration 60, loss = 0.0060
Iteration 80, loss = 0.0039
--- Epoch 995 / 100000 - 3443 epochs total
Iteration 0, loss = 0.0058
Iteration 20, loss = 0.0080
Iteration 40, loss = 0.0117
Iteration 60, loss = 0.0162
Iteration 80, loss = 0.0034
--- Epoch 996 / 100000 - 3444 epochs total
Iteration 0, loss = 0.0065
Iteration 20, loss = 0.0189
Iteration 40, loss = 0.0069
Iteration 60, loss = 0.0046
Iteration 80, loss = 0.0068
--- Epoch 997 / 100000 - 3445 epochs total
Iteration 0, loss = 0.0124
Iteration 20, loss = 0.0010
Iteration 40, loss = 0.0055
Iteration 60, loss = 0.0034
Iteration 80, loss = 0.0063
--- Epoch 998 / 100000 - 3446 epochs total
Iteration 0, loss = 0.0416
Iteration 20, loss = 0.0546
Iteration 40, loss = 0.0054
Iteration 60, loss = 0.0077
Iteration 80, loss = 0.0558
--- Epoch 999 / 100000 - 3447 epochs total
Iteration 0, loss = 0.0012
Iteration 20, loss = 0.0353
Iteration 40, loss = 0.0040
Iteration 60, loss = 0.0052
Iteration 80, loss = 0.0123
--- Epoch 1000 / 100000 - 3448 epochs total
Iteration 0, loss = 0.0066
Iteration 20, loss = 0.0052
Iteration 40, loss = 0.0056
Iteration 60, loss = 0.0141
Iteration 80, loss = 0.0046
--- Epoch 1001 / 100000 - 3449 epochs total
Iteration 0, loss = 0.0129
Iteration 20, loss = 0.0096
Iteration 40, loss = 0.0118
Iteration 60, loss = 0.0295
Iteration 80, loss = 0.0140
--- Epoch 1002 / 100000 - 3450 epochs total
Iteration 0, loss = 0.0446
Iteration 20, loss = 0.0032
Iteration 40, loss = 0.0062
Iteration 60, loss = 0.0019
Iteration 80, loss = 0.0172
--- Epoch 1003 / 100000 - 3451 epochs total
Iteration 0, loss = 0.0024
Iteration 20, loss = 0.0018
Iteration 40, loss = 0.0013
Iteration 60, loss = 0.0083
Iteration 80, loss = 0.0054
--- Epoch 1004 / 100000 - 3452 epochs total
Iteration 0, loss = 0.0029
Iteration 20, loss = 0.0020
Iteration 40, loss = 0.0033
Iteration 60, loss = 0.0033
Iteration 80, loss = 0.0150
--- Epoch 1005 / 100000 - 3453 epochs total
Iteration 0, loss = 0.0037
Iteration 20, loss = 0.0135
Iteration 40, loss = 0.0160
Iteration 60, loss = 0.0039
Iteration 80, loss = 0.0054
--- Epoch 1006 / 100000 - 3454 epochs total
Iteration 0, loss = 0.0017
Iteration 20, loss = 0.0017
Iteration 40, loss = 0.0067
Iteration 60, loss = 0.0042
Iteration 80, loss = 0.0112
--- Epoch 1007 / 100000 - 3455 epochs total
Iteration 0, loss = 0.0113
Iteration 20, loss = 0.0466
Iteration 40, loss = 0.0091
Iteration 60, loss = 0.0047
Iteration 80, loss = 0.0131
--- Epoch 1008 / 100000 - 3456 epochs total
Iteration 0, loss = 0.0110
Iteration 20, loss = 0.0072
Iteration 40, loss = 0.0107
Iteration 60, loss = 0.0129
Iteration 80, loss = 0.0067
--- Epoch 1009 / 100000 - 3457 epochs total
Iteration 0, loss = 0.0085
Iteration 20, loss = 0.0019
Iteration 40, loss = 0.0178
Iteration 60, loss = 0.0101
Iteration 80, loss = 0.0169
--- Epoch 1010 / 100000 - 3458 epochs total
Iteration 0, loss = 0.0142
Iteration 20, loss = 0.0125
Iteration 40, loss = 0.0065
Iteration 60, loss = 0.0058
Iteration 80, loss = 0.0063
--- Epoch 1011 / 100000 - 3459 epochs total
Iteration 0, loss = 0.0129
Iteration 20, loss = 0.0016
Iteration 40, loss = 0.0054
Iteration 60, loss = 0.0027
Iteration 80, loss = 0.0082
--- Epoch 1012 / 100000 - 3460 epochs total
Iteration 0, loss = 0.0041
Iteration 20, loss = 0.0037
Iteration 40, loss = 0.0072
Iteration 60, loss = 0.0132
Iteration 80, loss = 0.0255
--- Epoch 1013 / 100000 - 3461 epochs total
Iteration 0, loss = 0.0214
Iteration 20, loss = 0.0045
Iteration 40, loss = 0.0080
Iteration 60, loss = 0.0090
Iteration 80, loss = 0.0095
--- Epoch 1014 / 100000 - 3462 epochs total
Iteration 0, loss = 0.0045
Iteration 20, loss = 0.0130
Iteration 40, loss = 0.0046
Iteration 60, loss = 0.0142
Iteration 80, loss = 0.0050
--- Epoch 1015 / 100000 - 3463 epochs total
Iteration 0, loss = 0.0064
Iteration 20, loss = 0.0085
Iteration 40, loss = 0.0115
Iteration 60, loss = 0.0060
Iteration 80, loss = 0.0077
--- Epoch 1016 / 100000 - 3464 epochs total
Iteration 0, loss = 0.0034
Iteration 20, loss = 0.0281
Iteration 40, loss = 0.0055
Iteration 60, loss = 0.0021
Iteration 80, loss = 0.0027
--- Epoch 1017 / 100000 - 3465 epochs total
Iteration 0, loss = 0.0014
Iteration 20, loss = 0.0025
Iteration 40, loss = 0.0100
Iteration 60, loss = 0.0124
Iteration 80, loss = 0.0250
--- Epoch 1018 / 100000 - 3466 epochs total
Iteration 0, loss = 0.0032
Iteration 20, loss = 0.0038
Iteration 40, loss = 0.0110
Iteration 60, loss = 0.0127
Iteration 80, loss = 0.0160
--- Epoch 1019 / 100000 - 3467 epochs total
Iteration 0, loss = 0.0102
Iteration 20, loss = 0.0061
Iteration 40, loss = 0.0043
Iteration 60, loss = 0.0177
Iteration 80, loss = 0.0135
--- Epoch 1020 / 100000 - 3468 epochs total
Iteration 0, loss = 0.0148
Iteration 20, loss = 0.0060
Iteration 40, loss = 0.0204
Iteration 60, loss = 0.0179
Iteration 80, loss = 0.0055
--- Epoch 1021 / 100000 - 3469 epochs total
Iteration 0, loss = 0.0059
Iteration 20, loss = 0.0030
Iteration 40, loss = 0.0093
Iteration 60, loss = 0.0032
Iteration 80, loss = 0.0046
--- Epoch 1022 / 100000 - 3470 epochs total
Iteration 0, loss = 0.0199
Iteration 20, loss = 0.0025
Iteration 40, loss = 0.0042
Iteration 60, loss = 0.0021
Iteration 80, loss = 0.0054
--- Epoch 1023 / 100000 - 3471 epochs total
Iteration 0, loss = 0.0068
Iteration 20, loss = 0.0145
Iteration 40, loss = 0.0052
Iteration 60, loss = 0.0076
Iteration 80, loss = 0.0108
--- Epoch 1024 / 100000 - 3472 epochs total
Iteration 0, loss = 0.0043
Iteration 20, loss = 0.0011
Iteration 40, loss = 0.0064
Iteration 60, loss = 0.0035
Iteration 80, loss = 0.0072
--- Epoch 1025 / 100000 - 3473 epochs total
Iteration 0, loss = 0.0142
Iteration 20, loss = 0.0098
Iteration 40, loss = 0.0638
Iteration 60, loss = 0.0075
Iteration 80, loss = 0.0031
--- Epoch 1026 / 100000 - 3474 epochs total
Iteration 0, loss = 0.0183
Iteration 20, loss = 0.0047
Iteration 40, loss = 0.0134
Iteration 60, loss = 0.0067
Iteration 80, loss = 0.0049
--- Epoch 1027 / 100000 - 3475 epochs total
Iteration 0, loss = 0.0158
Iteration 20, loss = 0.0092
Iteration 40, loss = 0.0024
Iteration 60, loss = 0.0049
Iteration 80, loss = 0.0073
--- Epoch 1028 / 100000 - 3476 epochs total
Iteration 0, loss = 0.0174
Iteration 20, loss = 0.0043
Iteration 40, loss = 0.0189
Iteration 60, loss = 0.0049
Iteration 80, loss = 0.0059
--- Epoch 1029 / 100000 - 3477 epochs total
Iteration 0, loss = 0.0045
Iteration 20, loss = 0.0339
Iteration 40, loss = 0.0187
Iteration 60, loss = 0.0109
Iteration 80, loss = 0.0478
--- Epoch 1030 / 100000 - 3478 epochs total
Iteration 0, loss = 0.0225
Iteration 20, loss = 0.0031
Iteration 40, loss = 0.0046
Iteration 60, loss = 0.0088
Iteration 80, loss = 0.0044
--- Epoch 1031 / 100000 - 3479 epochs total
Iteration 0, loss = 0.0282
Iteration 20, loss = 0.0093
Iteration 40, loss = 0.0038
Iteration 60, loss = 0.0181
Iteration 80, loss = 0.0140
--- Epoch 1032 / 100000 - 3480 epochs total
Iteration 0, loss = 0.0035
Iteration 20, loss = 0.0142
Iteration 40, loss = 0.0208
Iteration 60, loss = 0.0114
Iteration 80, loss = 0.0017
--- Epoch 1033 / 100000 - 3481 epochs total
Iteration 0, loss = 0.0120
Iteration 20, loss = 0.0110
Iteration 40, loss = 0.0015
Iteration 60, loss = 0.0192
Iteration 80, loss = 0.0161
--- Epoch 1034 / 100000 - 3482 epochs total
Iteration 0, loss = 0.0118
Iteration 20, loss = 0.0372
Iteration 40, loss = 0.0060
Iteration 60, loss = 0.0034
Iteration 80, loss = 0.0494
--- Epoch 1035 / 100000 - 3483 epochs total
Iteration 0, loss = 0.0031
Iteration 20, loss = 0.0039
Iteration 40, loss = 0.0178
Iteration 60, loss = 0.0021
Iteration 80, loss = 0.0050
--- Epoch 1036 / 100000 - 3484 epochs total
Iteration 0, loss = 0.0158
Iteration 20, loss = 0.0117
Iteration 40, loss = 0.0125
Iteration 60, loss = 0.0038
Iteration 80, loss = 0.0041
--- Epoch 1037 / 100000 - 3485 epochs total
Iteration 0, loss = 0.0233
Iteration 20, loss = 0.0123
Iteration 40, loss = 0.0021
Iteration 60, loss = 0.0021
Iteration 80, loss = 0.0320
--- Epoch 1038 / 100000 - 3486 epochs total
Iteration 0, loss = 0.0014
Iteration 20, loss = 0.0131
Iteration 40, loss = 0.0038
Iteration 60, loss = 0.0031
Iteration 80, loss = 0.0027
--- Epoch 1039 / 100000 - 3487 epochs total
Iteration 0, loss = 0.0180
Iteration 20, loss = 0.0020
Iteration 40, loss = 0.0272
Iteration 60, loss = 0.0021
Iteration 80, loss = 0.0257
--- Epoch 1040 / 100000 - 3488 epochs total
Iteration 0, loss = 0.0080
Iteration 20, loss = 0.0048
Iteration 40, loss = 0.0117
Iteration 60, loss = 0.0040
Iteration 80, loss = 0.0066
--- Epoch 1041 / 100000 - 3489 epochs total
Iteration 0, loss = 0.0025
Iteration 20, loss = 0.0023
Iteration 40, loss = 0.0037
Iteration 60, loss = 0.0092
Iteration 80, loss = 0.0087
--- Epoch 1042 / 100000 - 3490 epochs total
Iteration 0, loss = 0.0078
Iteration 20, loss = 0.0051
Iteration 40, loss = 0.0446
Iteration 60, loss = 0.0052
Iteration 80, loss = 0.0070
--- Epoch 1043 / 100000 - 3491 epochs total
Iteration 0, loss = 0.0389
Iteration 20, loss = 0.0149
Iteration 40, loss = 0.0057
Iteration 60, loss = 0.0240
Iteration 80, loss = 0.0079
--- Epoch 1044 / 100000 - 3492 epochs total
Iteration 0, loss = 0.0087
Iteration 20, loss = 0.0083
Iteration 40, loss = 0.0048
Iteration 60, loss = 0.0046
Iteration 80, loss = 0.0066
--- Epoch 1045 / 100000 - 3493 epochs total
Iteration 0, loss = 0.0155
Iteration 20, loss = 0.0083
Iteration 40, loss = 0.0073
Iteration 60, loss = 0.0022
Iteration 80, loss = 0.0115
--- Epoch 1046 / 100000 - 3494 epochs total
Iteration 0, loss = 0.0206
Iteration 20, loss = 0.0274
Iteration 40, loss = 0.0014
Iteration 60, loss = 0.0694
Iteration 80, loss = 0.0032
--- Epoch 1047 / 100000 - 3495 epochs total
Iteration 0, loss = 0.0063
Iteration 20, loss = 0.0073
Iteration 40, loss = 0.0137
Iteration 60, loss = 0.0050
Iteration 80, loss = 0.0056
--- Epoch 1048 / 100000 - 3496 epochs total
Iteration 0, loss = 0.0114
Iteration 20, loss = 0.0225
Iteration 40, loss = 0.0014
Iteration 60, loss = 0.0086
Iteration 80, loss = 0.0084
--- Epoch 1049 / 100000 - 3497 epochs total
Iteration 0, loss = 0.0099
Iteration 20, loss = 0.0331
Iteration 40, loss = 0.0239
Iteration 60, loss = 0.0113
Iteration 80, loss = 0.0482
--- Epoch 1050 / 100000 - 3498 epochs total
Iteration 0, loss = 0.0076
Iteration 20, loss = 0.0328
Iteration 40, loss = 0.0095
Iteration 60, loss = 0.0157
Iteration 80, loss = 0.0235
--- Epoch 1051 / 100000 - 3499 epochs total
Iteration 0, loss = 0.0118
Iteration 20, loss = 0.0093
Iteration 40, loss = 0.0080
Iteration 60, loss = 0.0035
Iteration 80, loss = 0.0107
--- Epoch 1052 / 100000 - 3500 epochs total
Iteration 0, loss = 0.0083
Iteration 20, loss = 0.0104
Iteration 40, loss = 0.0050
Iteration 60, loss = 0.0475
Iteration 80, loss = 0.0050
---------------------------------------------------------------------------
KeyboardInterrupt                         Traceback (most recent call last)
<ipython-input-161-ca87b0d12256> in <module>
----> 1 train(model14, optimizer, epochs=100000, x_train=data["X_train"],  y_train=data["y_train"], criterion=nn.MSELoss())

<ipython-input-18-95dee9c67ab2> in train(model, optimizer, epochs, x_train, y_train, criterion)
     34             # Zero out all of the gradients for the variables which the optimizer
     35             # will update.
---> 36             optimizer.zero_grad()
     37 
     38             # This is the backwards pass: compute the gradient of the loss with

/opt/anaconda3/envs/cs682/lib/python3.6/site-packages/torch/optim/optimizer.py in zero_grad(self)
    170                 if p.grad is not None:
    171                     p.grad.detach_()
--> 172                     p.grad.zero_()
    173 
    174     def step(self, closure):

KeyboardInterrupt: 
In [167]:
# Run testModel on model14 with the test split: the grayscale images
# (data["X_test"]) are the input and the original color images
# (data["y_test"]) are the target, using the same MSE criterion that was
# passed to train() for this model.
# NOTE(review): testModel is defined in an earlier cell; presumably it
# reports the test loss -- confirm against its definition.
# NOTE(review): the preceding train() run was interrupted by hand
# (KeyboardInterrupt), so model14 holds whatever weights it had at that point.
testModel(
    model14,
    x_test=data["X_test"],
    y_test=data["y_test"],
    criterion=nn.MSELoss()
)
In [ ]: